| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643 |
- //
- // Copyright (c) 2019 Vinnie Falco (vinnie.falco@gmail.com)
- //
- // Distributed under the Boost Software License, Version 1.0. (See accompanying
- // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
- //
- // Official repository: https://github.com/boostorg/json
- //
- #ifndef BOOST_JSON_STREAM_PARSER_HPP
- #define BOOST_JSON_STREAM_PARSER_HPP
- #include <boost/json/detail/config.hpp>
- #include <boost/json/basic_parser.hpp>
- #include <boost/json/parse_options.hpp>
- #include <boost/json/storage_ptr.hpp>
- #include <boost/json/value.hpp>
- #include <boost/json/detail/handler.hpp>
- #include <type_traits>
- #include <cstddef>
- namespace boost {
- namespace json {
- //----------------------------------------------------------
- /** A DOM parser for JSON text contained in multiple buffers.
- This class is used to parse a JSON text contained in a series of one or
- more character buffers, into a @ref value container. It implements a
- [_streaming algorithm_](https://en.wikipedia.org/wiki/Streaming_algorithm),
- allowing these parsing strategies:
- @li parse a JSON file a piece at a time;
- @li parse incoming JSON text as it arrives, one buffer at a time;
- @li parse with bounded resource consumption per cycle.
- @par Usage
- To use the parser first construct it, then optionally call @ref reset to
- specify a @ref storage_ptr to use for the resulting @ref value. Then call
- @ref write one or more times to parse a single, complete JSON text. Call
- @ref done to determine if the parse has completed. To indicate there are no
- more buffers, call @ref finish. If the parse is successful, call @ref
- release to take ownership of the value:
- @code
- stream_parser p; // construct a parser
- p.write( "[1,2" ); // parse some of a JSON text
- p.write( ",3,4]" ); // parse the rest of the JSON text
- assert( p.done() ); // we have a complete JSON text
- value jv = p.release(); // take ownership of the value
- @endcode
- @par Extra Data
- When the character buffer provided as input contains additional data that
- is not part of the complete JSON text, an error is returned. The @ref
- write_some function is an alternative which allows the parse to finish
- early, without consuming all the characters in the buffer. This allows
- parsing of a buffer containing multiple individual JSON texts or containing
- different protocol data:
- @code
- stream_parser p; // construct a parser
- std::size_t n; // number of characters used
- n = p.write_some( "[1,2" ); // parse some of a JSON text
- assert( n == 4 ); // all characters consumed
- n = p.write_some( ",3,4] null" ); // parse the remainder of the JSON text
- assert( n == 6 ); // only some characters consumed
- assert( p.done() ); // we have a complete JSON text
- value jv = p.release(); // take ownership of the value
- @endcode
- @par Temporary Storage
- The parser may dynamically allocate temporary storage as needed to
- accommodate the nesting level of the JSON text being parsed. Temporary
- storage is first obtained from an optional, caller-owned buffer specified
- upon construction. When that is exhausted, the next allocation uses the
- @ref boost::container::pmr::memory_resource passed to the constructor; if
- no such argument is specified, the default memory resource is used.
- Temporary storage is freed only when the parser is destroyed. The
- performance of parsing multiple JSON texts may be improved by reusing the
- same parser instance.
- It is important to note that the @ref
- boost::container::pmr::memory_resource supplied upon construction is used
- for temporary storage only, and not for allocating the elements which make
- up the parsed value. That other memory resource is optionally supplied in
- each call to @ref reset.
- @par Duplicate Keys
- If there are object elements with duplicate keys; that is, if multiple
- elements in an object have keys that compare equal, only the last
- equivalent element will be inserted.
- @par Non-Standard JSON
- The @ref parse_options structure optionally provided upon construction is
- used to customize some parameters of the parser, including which
- non-standard JSON extensions should be allowed. A default-constructed parse
- options allows only standard JSON.
- @par Thread Safety
- Distinct instances may be accessed concurrently. Non-const member functions
- of a shared instance may not be called concurrently with any other member
- functions of that instance.
- @see @ref parse, @ref parser, @ref parse_options.
- */
- class stream_parser
- {
- // The underlying parser; every public member forwards to it
- // (see done() below) or is implemented out of line.
- basic_parser<detail::handler> p_;
- public:
- /** Destructor.
- All dynamically allocated memory, including
- any incomplete parsing results, is freed.
- @par Complexity
- Linear in the size of partial results.
- @par Exception Safety
- No-throw guarantee.
- */
- ~stream_parser() = default;
- /** Constructors.
- Construct a new parser.
- The parser will only support standard JSON if overloads **(1)**
- or **(2)** are used. Otherwise the parser will support extensions
- specified by the parameter `opt`.
- The parsed value will use the \<\<default_memory_resource,default
- memory resource\>\> for storage. To use a different resource, call @ref
- reset after construction.
- The main difference between the overloads is in what the constructed
- parser will use for temporary storage:
- @li **(1)** the constructed parser uses the default memory resource for
- temporary storage.
- @li **(2)**, **(3)** the constructed parser uses the memory resource of
- `sp` for temporary storage.
- @li **(4)**, **(6)** the constructed parser first uses the caller-owned
- storage `[buffer, buffer + size)` for temporary storage, falling back
- to the memory resource of `sp` if needed.
- @li **(5)**, **(7)** the constructed parser first uses the caller-owned
- storage `[buffer, buffer + N)` for temporary storage, falling back to
- the memory resource of `sp` if needed.
- @note Ownership of `buffer` is not transferred. The caller is
- responsible for ensuring the lifetime of the storage pointed to by
- `buffer` extends until the parser is destroyed.
- Overload **(8)** is the copy constructor. The type is neither copyable
- nor movable, so the overload is deleted.
- @par Complexity
- Constant.
- @par Exception Safety
- No-throw guarantee.
- @{
- */
- stream_parser() noexcept
- : stream_parser({}, {})
- {
- }
- /** Overload
- @param sp The memory resource to use for temporary storage.
- */
- explicit
- stream_parser(storage_ptr sp) noexcept
- : stream_parser(std::move(sp), {})
- {
- }
- /** Overload
- @param sp
- @param opt The parsing options to use.
- */
- BOOST_JSON_DECL
- stream_parser(
- storage_ptr sp,
- parse_options const& opt) noexcept;
- /** Overload
- @param sp
- @param opt
- @param buffer A pointer to valid storage.
- @param size The number of valid bytes in `buffer`.
- */
- BOOST_JSON_DECL
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- unsigned char* buffer,
- std::size_t size) noexcept;
- /** Overload
- @tparam N The number of valid bytes in `buffer`.
- @param sp
- @param opt
- @param buffer
- */
- template<std::size_t N>
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- unsigned char(&buffer)[N]) noexcept
- : stream_parser(std::move(sp),
- opt, &buffer[0], N)
- {
- }
- #if defined(__cpp_lib_byte) || defined(BOOST_JSON_DOCS)
- /** Overload
- @param sp
- @param opt
- @param buffer
- @param size
- */
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- std::byte* buffer,
- std::size_t size) noexcept
- // Delegates to the `unsigned char*` overload. `sp` is a by-value
- // sink parameter, so it is moved rather than copied, as in every
- // other delegating overload.
- : stream_parser(std::move(sp), opt, reinterpret_cast<
- unsigned char*>(buffer), size)
- {
- }
- /** Overload
- @tparam N
- @param sp
- @param opt
- @param buffer
- */
- template<std::size_t N>
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- std::byte(&buffer)[N]) noexcept
- : stream_parser(std::move(sp),
- opt, &buffer[0], N)
- {
- }
- #endif
- #ifndef BOOST_JSON_DOCS
- // Safety net for accidental buffer overflows
- template<std::size_t N>
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- unsigned char(&buffer)[N],
- std::size_t n) noexcept
- : stream_parser(std::move(sp),
- opt, &buffer[0], n)
- {
- // If this goes off, check your parameters
- // closely, chances are you passed an array
- // thinking it was a pointer.
- BOOST_ASSERT(n <= N);
- }
- #ifdef __cpp_lib_byte
- // Safety net for accidental buffer overflows
- template<std::size_t N>
- stream_parser(
- storage_ptr sp,
- parse_options const& opt,
- std::byte(&buffer)[N], std::size_t n) noexcept
- : stream_parser(std::move(sp),
- opt, &buffer[0], n)
- {
- // If this goes off, check your parameters
- // closely, chances are you passed an array
- // thinking it was a pointer.
- BOOST_ASSERT(n <= N);
- }
- #endif
- #endif
- /// Overload
- stream_parser(
- stream_parser const&) = delete;
- /// @}
- /** Assignment operator.
- This type is neither copyable nor movable, so copy assignment operator
- is deleted.
- */
- stream_parser& operator=(
- stream_parser const&) = delete;
- /** Reset the parser for a new JSON text.
- This function is used to reset the parser to prepare it for parsing
- a new complete JSON text. Any previous partial results are destroyed.
- The new value will use the memory resource of `sp`.
- @par Complexity
- Constant or linear in the size of any previous partial parsing results.
- @par Exception Safety
- No-throw guarantee.
- @param sp A pointer to the @ref boost::container::pmr::memory_resource.
- */
- BOOST_JSON_DECL
- void
- reset(storage_ptr sp = {}) noexcept;
- /** Check if a complete JSON text has been parsed.
- This function returns `true` when all of these conditions are met:
- @li A complete serialized JSON text has been presented to the parser,
- and
- @li No error has occurred since the parser was constructed, or since
- the last call to @ref reset.
- @par Complexity
- Constant.
- @par Exception Safety
- No-throw guarantee.
- */
- bool
- done() const noexcept
- {
- return p_.done();
- }
- /** Parse a buffer containing all or part of a complete JSON text.
- This function parses JSON text contained in the specified character
- buffer. If parsing completes, any additional characters past the end of
- the complete JSON text are ignored. The function returns the actual
- number of characters parsed, which may be less than the size of the
- input. This allows parsing of a buffer containing multiple individual
- JSON texts or containing different protocol data.
- Overloads **(1)**, **(2)**, **(4)**, and **(5)** report errors by
- setting `ec`. Overloads **(3)** and **(6)** report errors by throwing
- exceptions. Upon error or exception, subsequent calls will fail until
- @ref reset is called to parse a new JSON text.
- @note To indicate there are no more character buffers, such as when
- @ref done returns `false` after writing, call @ref finish.
- @par Example
- @code
- stream_parser p; // construct a parser
- std::size_t n; // number of characters used
- n = p.write_some( "[1,2" ); // parse the first part of the JSON text
- assert( n == 4 ); // all characters consumed
- n = p.write_some( "3,4] null" ); // parse the rest of the JSON text
- assert( n == 5 ); // only some characters consumed
- value jv = p.release(); // take ownership of the value
- @endcode
- @par Complexity
- @li **(1)**--**(3)** linear in `size`.
- @li **(4)**--**(6)** linear in `s.size()`.
- @par Exception Safety
- Basic guarantee. Calls to `memory_resource::allocate` may throw.
- @return The number of characters consumed from the buffer.
- @param data A pointer to a buffer of `size` characters to parse.
- @param size The number of characters pointed to by `data`.
- @param ec Set to the error, if any occurred.
- @{
- */
- BOOST_JSON_DECL
- std::size_t
- write_some(
- char const* data,
- std::size_t size,
- system::error_code& ec);
- BOOST_JSON_DECL
- std::size_t
- write_some(
- char const* data,
- std::size_t size,
- std::error_code& ec);
- /** Overload
- @param data
- @param size
- @throw boost::system::system_error Thrown on error.
- */
- BOOST_JSON_DECL
- std::size_t
- write_some(
- char const* data,
- std::size_t size);
- /** Overload
- @param s The character string to parse.
- @param ec
- */
- std::size_t
- write_some(
- string_view s,
- system::error_code& ec)
- {
- return write_some(
- s.data(), s.size(), ec);
- }
- /** Overload
- @param s
- @param ec
- */
- std::size_t
- write_some(
- string_view s,
- std::error_code& ec)
- {
- return write_some(
- s.data(), s.size(), ec);
- }
- /** Overload
- @param s
- */
- std::size_t
- write_some(
- string_view s)
- {
- return write_some(
- s.data(), s.size());
- }
- /// @}
- /** Parse a buffer containing all or part of a complete JSON text.
- This function parses all or part of a JSON text contained in the
- specified character buffer. The entire buffer must be consumed; if
- there are additional characters past the end of the complete JSON text,
- the parse fails and an error is returned.
- Overloads **(1)**, **(2)**, **(4)**, and **(5)** report errors by
- setting `ec`. Overloads **(3)** and **(6)** report errors by throwing
- exceptions. Upon error or exception, subsequent calls will fail until
- @ref reset is called to parse a new JSON text.
- @note To indicate there are no more character buffers, such as when
- @ref done returns `false` after writing, call @ref finish.
- @par Example
- @code
- stream_parser p; // construct a parser
- std::size_t n; // number of characters used
- n = p.write( "[1,2" ); // parse some of the JSON text
- assert( n == 4 ); // all characters consumed
- n = p.write( "3,4]" ); // parse the rest of the JSON text
- assert( n == 4 ); // all characters consumed
- value jv = p.release(); // take ownership of the value
- @endcode
- @par Complexity
- @li **(1)**--**(3)** linear in `size`.
- @li **(4)**--**(6)** linear in `s.size()`.
- @par Exception Safety
- Basic guarantee. Calls to `memory_resource::allocate` may throw.
- @return The number of characters consumed from the buffer.
- @param data A pointer to a buffer of `size` characters to parse.
- @param size The number of characters pointed to by `data`.
- @param ec Set to the error, if any occurred.
- @{
- */
- BOOST_JSON_DECL
- std::size_t
- write(
- char const* data,
- std::size_t size,
- system::error_code& ec);
- BOOST_JSON_DECL
- std::size_t
- write(
- char const* data,
- std::size_t size,
- std::error_code& ec);
- /** Overload
- @param data
- @param size
- @throw boost::system::system_error Thrown on error.
- */
- BOOST_JSON_DECL
- std::size_t
- write(
- char const* data,
- std::size_t size);
- /** Overload
- @param s The character string to parse.
- @param ec
- */
- std::size_t
- write(
- string_view s,
- system::error_code& ec)
- {
- return write(
- s.data(), s.size(), ec);
- }
- /** Overload
- @param s
- @param ec
- */
- std::size_t
- write(
- string_view s,
- std::error_code& ec)
- {
- return write(
- s.data(), s.size(), ec);
- }
- /** Overload
- @param s
- */
- std::size_t
- write(
- string_view s)
- {
- return write(
- s.data(), s.size());
- }
- /// @}
- /** Indicate the end of JSON input.
- This function is used to indicate that there are no more character
- buffers in the current JSON text being parsed. If the resulting JSON
- text is incomplete, **(1)** and **(2)** assign the relevant
- `error_code` to `ec`, while **(3)** throws an exception.
- Upon error or exception, subsequent calls will fail until @ref reset is
- called to parse a new JSON text.
- @par Example
- In the code below, @ref finish is called to
- indicate there are no more digits in the
- resulting number:
- @code
- stream_parser p; // construct a parser
- p.write( "3." ); // write the first part of the number
- p.write( "14" ); // write the second part of the number
- assert( ! p.done() ); // there could be more digits
- p.finish(); // indicate the end of the JSON input
- assert( p.done() ); // now we are finished
- value jv = p.release(); // take ownership of the value
- @endcode
- @par Complexity
- Constant.
- @par Exception Safety
- Basic guarantee. Calls to `memory_resource::allocate` may throw.
- @param ec Set to the error, if any occurred.
- @{
- */
- BOOST_JSON_DECL
- void
- finish(system::error_code& ec);
- BOOST_JSON_DECL
- void
- finish(std::error_code& ec);
- /** Overload
- @throw boost::system::system_error Parsing error.
- */
- BOOST_JSON_DECL
- void
- finish();
- /// @}
- /** Return the parsed JSON as a @ref value.
- This returns the parsed value, or throws an exception if the parsing is
- incomplete or failed. If `! this->done()`, calls @ref finish() first.
- It is necessary to call @ref reset after calling this function in order
- to parse another JSON text.
- @par Complexity
- Constant.
- @return The parsed value. Ownership of this value is transferred to the
- caller.
- @throw boost::system::system_error A complete JSON text hasn't been
- parsed, or parsing failed.
- */
- BOOST_JSON_DECL
- value
- release();
- };
- } // namespace json
- } // namespace boost
- #endif
|