2022-07-20 18:38:07 +08:00
|
|
|
// __ _____ _____ _____
|
|
|
|
// __| | __| | | | JSON for Modern C++
|
|
|
|
// | | |__ | | | | | | version 3.10.5
|
|
|
|
// |_____|_____|_____|_|___| https://github.com/nlohmann/json
|
|
|
|
//
|
|
|
|
// SPDX-FileCopyrightText: 2013-2022 Niels Lohmann <https://nlohmann.me>
|
|
|
|
// SPDX-License-Identifier: MIT
|
|
|
|
|
2018-01-10 17:18:31 +08:00
|
|
|
#pragma once
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2019-03-17 07:27:44 +08:00
|
|
|
#include <array> // array
|
2017-08-15 01:28:01 +08:00
|
|
|
#include <cstddef> // size_t
|
|
|
|
#include <cstring> // strlen
|
|
|
|
#include <iterator> // begin, end, iterator_traits, random_access_iterator_tag, distance, next
|
|
|
|
#include <memory> // shared_ptr, make_shared, addressof
|
|
|
|
#include <numeric> // accumulate
|
|
|
|
#include <string> // string, char_traits
|
|
|
|
#include <type_traits> // enable_if, is_base_of, is_pointer, is_integral, remove_pointer
|
|
|
|
#include <utility> // pair, declval
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2021-05-31 20:26:45 +08:00
|
|
|
#ifndef JSON_NO_IO
|
2021-07-19 22:56:28 +08:00
|
|
|
#include <cstdio> // FILE *
|
2021-05-31 20:26:45 +08:00
|
|
|
#include <istream> // istream
|
|
|
|
#endif // JSON_NO_IO
|
|
|
|
|
2019-01-13 22:31:22 +08:00
|
|
|
#include <nlohmann/detail/iterators/iterator_traits.hpp>
|
2018-01-29 18:21:11 +08:00
|
|
|
#include <nlohmann/detail/macro_scope.hpp>
|
2017-08-14 22:48:55 +08:00
|
|
|
|
|
|
|
namespace nlohmann
|
|
|
|
{
|
|
|
|
namespace detail
|
|
|
|
{
|
2018-03-21 05:39:08 +08:00
|
|
|
/// the supported input formats
|
Support UBJSON-derived Binary JData (BJData) format (#3336)
* support UBJSON-derived Binary JData (BJData) format
* fix Codacy warning
* partially fix VS compilation errors
* fix additional VS errors
* fix more VS compilation errors
* fix additional warnings and errors for clang and msvc
* add more tests to cover the new bjdata types
* add tests for optimized ndarray, improve coverage, fix clang/gcc warnings
* gcc warn useless conversion but msvc gives an error
* fix ci_test errors
* complete test coverage, fix ci_test errors
* add half precision error test
* fix No newline at end of file error by clang
* simplify endian condition, format unit-bjdata
* remove broken test due to alloc limit
* full coverage, I hope
* move bjdata new markers from default to the same level as ubjson markers
* fix ci errors, add tests for new bjdata switch structure
* make is_bjdata const after using initializer list
* remove the unwanted assert
* move is_bjdata to an optional param to write_ubjson
* pass use_bjdata via output adapter
* revert order to avoid msvc 2015 unreferenced formal param error
* update BJData Spect V1 Draft-2 URL after spec release
* amalgamate code
* code polishing following @gregmarr's feedback
* make use_bjdata a non-default parameter
* fix ci error, remove unwanted param comment
* encode and decode bjdata ndarray in jdata annotations, enable roundtrip tests
* partially fix ci errors, add tests to improve coverage
* polish patch to remove ci errors
* fix a ndarray dim vector condition
* fix clang tidy error
* add sax test cases for ndarray
* add additional sax event tests
* adjust sax event numbering
* fix sax tests
* ndarray can only be used with array containers, discard if used in object
* complete test coverage
* disable [{SHTFNZ in optimized type due to security risks in #2793 and hampered readability
* fix ci error
* move OutputIsLittleEndian from tparam to param to replace use_bjdata
* fix ci clang gcc error
* fix ci static analysis error
* update json_test_data to 3.1.0, enable file-based bjdata unit tests
* fix stack overflow error on msvc 2019 and 2022
* use https link, update sax_parse_error after rebase
* make input_format const and use initializer
* return bool for write_bjdata_ndarray
* test write_bjdata_ndarray return value as boolean
* fix ci error
2022-04-30 03:17:30 +08:00
|
|
|
enum class input_format_t { json, cbor, msgpack, ubjson, bson, bjdata };
|
2018-03-21 05:39:08 +08:00
|
|
|
|
2017-08-14 22:48:55 +08:00
|
|
|
////////////////////
|
|
|
|
// input adapters //
|
|
|
|
////////////////////
|
|
|
|
|
2021-04-21 16:24:01 +08:00
|
|
|
#ifndef JSON_NO_IO
|
2018-12-12 22:28:42 +08:00
|
|
|
/*!
|
|
|
|
Input adapter for stdio file access. This adapter read only 1 byte and do not use any
|
2018-12-13 03:15:49 +08:00
|
|
|
buffer. This adapter is a very low level adapter.
|
2018-12-12 22:28:42 +08:00
|
|
|
*/
|
2020-02-20 03:59:31 +08:00
|
|
|
class file_input_adapter
|
2018-12-12 02:17:13 +08:00
|
|
|
{
|
2018-12-12 23:18:37 +08:00
|
|
|
public:
|
2020-05-28 00:40:04 +08:00
|
|
|
using char_type = char;
|
|
|
|
|
2019-07-02 04:37:30 +08:00
|
|
|
JSON_HEDLEY_NON_NULL(2)
|
2020-07-16 20:45:39 +08:00
|
|
|
explicit file_input_adapter(std::FILE* f) noexcept
|
2018-12-13 05:33:25 +08:00
|
|
|
: m_file(f)
|
2022-07-23 07:26:51 +08:00
|
|
|
{
|
|
|
|
JSON_ASSERT(m_file != nullptr);
|
|
|
|
}
|
2018-12-12 02:17:13 +08:00
|
|
|
|
2019-03-17 19:01:49 +08:00
|
|
|
// make class move-only
|
|
|
|
file_input_adapter(const file_input_adapter&) = delete;
|
2021-03-24 14:15:18 +08:00
|
|
|
file_input_adapter(file_input_adapter&&) noexcept = default;
|
2019-03-17 19:01:49 +08:00
|
|
|
file_input_adapter& operator=(const file_input_adapter&) = delete;
|
2020-03-03 12:50:01 +08:00
|
|
|
file_input_adapter& operator=(file_input_adapter&&) = delete;
|
2021-03-24 14:15:18 +08:00
|
|
|
~file_input_adapter() = default;
|
2019-03-17 19:01:49 +08:00
|
|
|
|
2020-02-20 03:59:31 +08:00
|
|
|
std::char_traits<char>::int_type get_character() noexcept
|
2018-12-12 02:17:13 +08:00
|
|
|
{
|
2018-12-13 05:33:25 +08:00
|
|
|
return std::fgetc(m_file);
|
2018-12-12 02:17:13 +08:00
|
|
|
}
|
2019-03-17 19:01:49 +08:00
|
|
|
|
2018-12-12 23:18:37 +08:00
|
|
|
private:
|
2018-12-12 02:17:13 +08:00
|
|
|
/// the file pointer to read from
|
2018-12-13 05:33:25 +08:00
|
|
|
std::FILE* m_file;
|
2018-12-12 02:17:13 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2017-08-14 22:48:55 +08:00
|
|
|
/*!
|
|
|
|
Input adapter for a (caching) istream. Ignores a UFT Byte Order Mark at
|
|
|
|
beginning of input. Does not support changing the underlying std::streambuf
|
|
|
|
in mid-input. Maintains underlying std::istream and std::streambuf to support
|
|
|
|
subsequent use of standard std::istream operations to process any input
|
|
|
|
characters following those used in parsing the JSON input. Clears the
|
|
|
|
std::istream flags; any input errors (e.g., EOF) will be detected by the first
|
|
|
|
subsequent call for input from the std::istream.
|
|
|
|
*/
|
2020-02-20 03:59:31 +08:00
|
|
|
class input_stream_adapter
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
|
|
|
public:
|
2020-05-28 00:40:04 +08:00
|
|
|
using char_type = char;
|
|
|
|
|
2020-02-20 03:59:31 +08:00
|
|
|
~input_stream_adapter()
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
|
|
|
// clear stream flags; we use underlying streambuf I/O, do not
|
2018-11-07 23:02:50 +08:00
|
|
|
// maintain ifstream flags, except eof
|
2020-06-23 04:32:21 +08:00
|
|
|
if (is != nullptr)
|
2020-02-20 03:59:31 +08:00
|
|
|
{
|
|
|
|
is->clear(is->rdstate() & std::ios::eofbit);
|
|
|
|
}
|
2017-08-14 22:48:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
explicit input_stream_adapter(std::istream& i)
|
2020-02-20 03:59:31 +08:00
|
|
|
: is(&i), sb(i.rdbuf())
|
2018-04-03 03:10:48 +08:00
|
|
|
{}
|
2017-08-14 22:48:55 +08:00
|
|
|
|
|
|
|
// delete because of pointer members
|
|
|
|
input_stream_adapter(const input_stream_adapter&) = delete;
|
|
|
|
input_stream_adapter& operator=(input_stream_adapter&) = delete;
|
2021-03-24 14:15:18 +08:00
|
|
|
input_stream_adapter& operator=(input_stream_adapter&&) = delete;
|
2020-02-20 03:59:31 +08:00
|
|
|
|
2021-03-24 14:15:18 +08:00
|
|
|
input_stream_adapter(input_stream_adapter&& rhs) noexcept
|
|
|
|
: is(rhs.is), sb(rhs.sb)
|
2020-02-20 03:59:31 +08:00
|
|
|
{
|
|
|
|
rhs.is = nullptr;
|
|
|
|
rhs.sb = nullptr;
|
|
|
|
}
|
|
|
|
|
2017-08-14 22:48:55 +08:00
|
|
|
// std::istream/std::streambuf use std::char_traits<char>::to_int_type, to
|
|
|
|
// ensure that std::char_traits<char>::eof() and the character 0xFF do not
|
2021-12-29 20:41:01 +08:00
|
|
|
// end up as the same value, e.g. 0xFFFFFFFF.
|
2020-02-20 03:59:31 +08:00
|
|
|
std::char_traits<char>::int_type get_character()
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
2020-02-20 03:59:31 +08:00
|
|
|
auto res = sb->sbumpc();
|
2018-11-07 23:02:50 +08:00
|
|
|
// set eof manually, as we don't use the istream interface.
|
2021-05-04 16:22:34 +08:00
|
|
|
if (JSON_HEDLEY_UNLIKELY(res == std::char_traits<char>::eof()))
|
2018-11-10 04:10:32 +08:00
|
|
|
{
|
2020-02-20 03:59:31 +08:00
|
|
|
is->clear(is->rdstate() | std::ios::eofbit);
|
2018-11-10 04:10:32 +08:00
|
|
|
}
|
2018-11-07 23:02:50 +08:00
|
|
|
return res;
|
2017-08-14 22:48:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
/// the associated input stream
|
2020-02-20 03:59:31 +08:00
|
|
|
std::istream* is = nullptr;
|
|
|
|
std::streambuf* sb = nullptr;
|
2017-08-14 22:48:55 +08:00
|
|
|
};
|
2021-04-21 16:24:01 +08:00
|
|
|
#endif // JSON_NO_IO
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
// General-purpose iterator-based adapter. It might not be as fast as
|
|
|
|
// theoretically possible for some containers, but it is extremely versatile.
|
|
|
|
template<typename IteratorType>
|
|
|
|
class iterator_input_adapter
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
|
|
|
public:
|
2020-05-28 00:40:04 +08:00
|
|
|
using char_type = typename std::iterator_traits<IteratorType>::value_type;
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
iterator_input_adapter(IteratorType first, IteratorType last)
|
2021-03-24 14:15:18 +08:00
|
|
|
: current(std::move(first)), end(std::move(last))
|
|
|
|
{}
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
typename std::char_traits<char_type>::int_type get_character()
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
2020-05-28 14:29:53 +08:00
|
|
|
if (JSON_HEDLEY_LIKELY(current != end))
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
auto result = std::char_traits<char_type>::to_int_type(*current);
|
|
|
|
std::advance(current, 1);
|
|
|
|
return result;
|
|
|
|
}
|
2021-01-27 19:54:46 +08:00
|
|
|
|
|
|
|
return std::char_traits<char_type>::eof();
|
2017-08-14 22:48:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2020-05-28 00:40:04 +08:00
|
|
|
IteratorType current;
|
|
|
|
IteratorType end;
|
|
|
|
|
|
|
|
template<typename BaseInputAdapter, size_t T>
|
2020-05-29 00:20:02 +08:00
|
|
|
friend struct wide_string_input_helper;
|
2020-05-28 00:40:04 +08:00
|
|
|
|
|
|
|
bool empty() const
|
|
|
|
{
|
|
|
|
return current == end;
|
|
|
|
}
|
2017-08-14 22:48:55 +08:00
|
|
|
};
|
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
|
|
|
|
template<typename BaseInputAdapter, size_t T>
|
|
|
|
struct wide_string_input_helper;
|
|
|
|
|
|
|
|
template<typename BaseInputAdapter>
|
|
|
|
struct wide_string_input_helper<BaseInputAdapter, 4>
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2018-10-03 20:51:49 +08:00
|
|
|
// UTF-32
|
2020-05-28 00:40:04 +08:00
|
|
|
static void fill_buffer(BaseInputAdapter& input,
|
2019-03-17 07:27:44 +08:00
|
|
|
std::array<std::char_traits<char>::int_type, 4>& utf8_bytes,
|
|
|
|
size_t& utf8_bytes_index,
|
|
|
|
size_t& utf8_bytes_filled)
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2018-10-03 20:51:49 +08:00
|
|
|
utf8_bytes_index = 0;
|
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
if (JSON_HEDLEY_UNLIKELY(input.empty()))
|
2018-10-03 20:51:49 +08:00
|
|
|
{
|
|
|
|
utf8_bytes[0] = std::char_traits<char>::eof();
|
|
|
|
utf8_bytes_filled = 1;
|
|
|
|
}
|
|
|
|
else
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2018-10-03 20:51:49 +08:00
|
|
|
// get the current character
|
2020-05-28 00:40:04 +08:00
|
|
|
const auto wc = input.get_character();
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2018-10-03 20:51:49 +08:00
|
|
|
// UTF-32 to UTF-8 encoding
|
|
|
|
if (wc < 0x80)
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2019-03-17 07:27:44 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(wc);
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 1;
|
|
|
|
}
|
2018-10-03 20:51:49 +08:00
|
|
|
else if (wc <= 0x7FF)
|
|
|
|
{
|
2020-06-06 20:30:17 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xC0u | ((static_cast<unsigned int>(wc) >> 6u) & 0x1Fu));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | (static_cast<unsigned int>(wc) & 0x3Fu));
|
2018-10-03 20:51:49 +08:00
|
|
|
utf8_bytes_filled = 2;
|
|
|
|
}
|
|
|
|
else if (wc <= 0xFFFF)
|
|
|
|
{
|
2020-06-06 20:30:17 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xE0u | ((static_cast<unsigned int>(wc) >> 12u) & 0x0Fu));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | ((static_cast<unsigned int>(wc) >> 6u) & 0x3Fu));
|
|
|
|
utf8_bytes[2] = static_cast<std::char_traits<char>::int_type>(0x80u | (static_cast<unsigned int>(wc) & 0x3Fu));
|
2018-10-03 20:51:49 +08:00
|
|
|
utf8_bytes_filled = 3;
|
|
|
|
}
|
|
|
|
else if (wc <= 0x10FFFF)
|
|
|
|
{
|
2020-06-06 20:30:17 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xF0u | ((static_cast<unsigned int>(wc) >> 18u) & 0x07u));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | ((static_cast<unsigned int>(wc) >> 12u) & 0x3Fu));
|
|
|
|
utf8_bytes[2] = static_cast<std::char_traits<char>::int_type>(0x80u | ((static_cast<unsigned int>(wc) >> 6u) & 0x3Fu));
|
|
|
|
utf8_bytes[3] = static_cast<std::char_traits<char>::int_type>(0x80u | (static_cast<unsigned int>(wc) & 0x3Fu));
|
2018-10-03 20:51:49 +08:00
|
|
|
utf8_bytes_filled = 4;
|
2018-04-02 01:12:36 +08:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-03 20:51:49 +08:00
|
|
|
// unknown character
|
2019-03-17 07:27:44 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(wc);
|
2018-10-03 20:51:49 +08:00
|
|
|
utf8_bytes_filled = 1;
|
2018-04-02 01:12:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2018-10-03 20:51:49 +08:00
|
|
|
};
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
template<typename BaseInputAdapter>
|
|
|
|
struct wide_string_input_helper<BaseInputAdapter, 2>
|
2018-10-03 20:51:49 +08:00
|
|
|
{
|
|
|
|
// UTF-16
|
2020-05-28 00:40:04 +08:00
|
|
|
static void fill_buffer(BaseInputAdapter& input,
|
2019-03-17 07:27:44 +08:00
|
|
|
std::array<std::char_traits<char>::int_type, 4>& utf8_bytes,
|
|
|
|
size_t& utf8_bytes_index,
|
|
|
|
size_t& utf8_bytes_filled)
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
|
|
|
utf8_bytes_index = 0;
|
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
if (JSON_HEDLEY_UNLIKELY(input.empty()))
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
|
|
|
utf8_bytes[0] = std::char_traits<char>::eof();
|
|
|
|
utf8_bytes_filled = 1;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
// get the current character
|
2020-05-28 00:40:04 +08:00
|
|
|
const auto wc = input.get_character();
|
2018-04-02 01:12:36 +08:00
|
|
|
|
|
|
|
// UTF-16 to UTF-8 encoding
|
|
|
|
if (wc < 0x80)
|
|
|
|
{
|
2019-03-17 07:27:44 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(wc);
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 1;
|
|
|
|
}
|
|
|
|
else if (wc <= 0x7FF)
|
|
|
|
{
|
2020-06-08 04:47:25 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xC0u | ((static_cast<unsigned int>(wc) >> 6u)));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | (static_cast<unsigned int>(wc) & 0x3Fu));
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 2;
|
|
|
|
}
|
2020-06-03 20:20:36 +08:00
|
|
|
else if (0xD800 > wc || wc >= 0xE000)
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2020-06-08 04:47:25 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xE0u | ((static_cast<unsigned int>(wc) >> 12u)));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | ((static_cast<unsigned int>(wc) >> 6u) & 0x3Fu));
|
|
|
|
utf8_bytes[2] = static_cast<std::char_traits<char>::int_type>(0x80u | (static_cast<unsigned int>(wc) & 0x3Fu));
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 3;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2020-07-11 19:39:14 +08:00
|
|
|
if (JSON_HEDLEY_UNLIKELY(!input.empty()))
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
const auto wc2 = static_cast<unsigned int>(input.get_character());
|
2020-06-08 04:47:25 +08:00
|
|
|
const auto charcode = 0x10000u + (((static_cast<unsigned int>(wc) & 0x3FFu) << 10u) | (wc2 & 0x3FFu));
|
2019-03-17 07:27:44 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(0xF0u | (charcode >> 18u));
|
|
|
|
utf8_bytes[1] = static_cast<std::char_traits<char>::int_type>(0x80u | ((charcode >> 12u) & 0x3Fu));
|
|
|
|
utf8_bytes[2] = static_cast<std::char_traits<char>::int_type>(0x80u | ((charcode >> 6u) & 0x3Fu));
|
|
|
|
utf8_bytes[3] = static_cast<std::char_traits<char>::int_type>(0x80u | (charcode & 0x3Fu));
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 4;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2019-03-17 07:27:44 +08:00
|
|
|
utf8_bytes[0] = static_cast<std::char_traits<char>::int_type>(wc);
|
2018-04-02 01:12:36 +08:00
|
|
|
utf8_bytes_filled = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2018-10-03 20:51:49 +08:00
|
|
|
};
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
// Wraps another input apdater to convert wide character types into individual bytes.
|
|
|
|
template<typename BaseInputAdapter, typename WideCharType>
|
2020-02-20 03:59:31 +08:00
|
|
|
class wide_string_input_adapter
|
2018-10-03 19:41:34 +08:00
|
|
|
{
|
|
|
|
public:
|
2020-06-06 20:30:17 +08:00
|
|
|
using char_type = char;
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
wide_string_input_adapter(BaseInputAdapter base)
|
|
|
|
: base_adapter(base) {}
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
typename std::char_traits<char>::int_type get_character() noexcept
|
2018-10-03 19:41:34 +08:00
|
|
|
{
|
|
|
|
// check if buffer needs to be filled
|
|
|
|
if (utf8_bytes_index == utf8_bytes_filled)
|
2018-04-02 01:12:36 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
fill_buffer<sizeof(WideCharType)>();
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-07-06 18:22:31 +08:00
|
|
|
JSON_ASSERT(utf8_bytes_filled > 0);
|
|
|
|
JSON_ASSERT(utf8_bytes_index == 0);
|
2018-04-02 01:12:36 +08:00
|
|
|
}
|
2018-10-03 19:41:34 +08:00
|
|
|
|
|
|
|
// use buffer
|
2020-07-06 18:22:31 +08:00
|
|
|
JSON_ASSERT(utf8_bytes_filled > 0);
|
|
|
|
JSON_ASSERT(utf8_bytes_index < utf8_bytes_filled);
|
2018-10-03 19:41:34 +08:00
|
|
|
return utf8_bytes[utf8_bytes_index++];
|
2018-04-02 01:12:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2020-05-28 00:40:04 +08:00
|
|
|
BaseInputAdapter base_adapter;
|
|
|
|
|
2018-10-03 19:41:34 +08:00
|
|
|
template<size_t T>
|
|
|
|
void fill_buffer()
|
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
wide_string_input_helper<BaseInputAdapter, T>::fill_buffer(base_adapter, utf8_bytes, utf8_bytes_index, utf8_bytes_filled);
|
2018-10-03 19:41:34 +08:00
|
|
|
}
|
2018-10-05 02:42:19 +08:00
|
|
|
|
2018-04-02 01:12:36 +08:00
|
|
|
/// a buffer for UTF-8 bytes
|
|
|
|
std::array<std::char_traits<char>::int_type, 4> utf8_bytes = {{0, 0, 0, 0}};
|
|
|
|
|
|
|
|
/// index to the utf8_codes array for the next valid byte
|
|
|
|
std::size_t utf8_bytes_index = 0;
|
|
|
|
/// number of valid bytes in the utf8_codes array
|
|
|
|
std::size_t utf8_bytes_filled = 0;
|
|
|
|
};
|
|
|
|
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
template<typename IteratorType, typename Enable = void>
|
|
|
|
struct iterator_input_adapter_factory
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
using iterator_type = IteratorType;
|
|
|
|
using char_type = typename std::iterator_traits<iterator_type>::value_type;
|
|
|
|
using adapter_type = iterator_input_adapter<iterator_type>;
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
static adapter_type create(IteratorType first, IteratorType last)
|
2020-05-28 00:40:04 +08:00
|
|
|
{
|
2020-05-28 14:29:53 +08:00
|
|
|
return adapter_type(std::move(first), std::move(last));
|
2020-05-28 00:40:04 +08:00
|
|
|
}
|
|
|
|
};
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
template<typename T>
|
2020-06-09 02:07:15 +08:00
|
|
|
struct is_iterator_of_multibyte
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-06-09 02:07:15 +08:00
|
|
|
using value_type = typename std::iterator_traits<T>::value_type;
|
|
|
|
enum
|
|
|
|
{
|
|
|
|
value = sizeof(value_type) > 1
|
|
|
|
};
|
|
|
|
};
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
template<typename IteratorType>
|
2020-06-09 02:07:15 +08:00
|
|
|
struct iterator_input_adapter_factory<IteratorType, enable_if_t<is_iterator_of_multibyte<IteratorType>::value>>
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 14:29:53 +08:00
|
|
|
using iterator_type = IteratorType;
|
|
|
|
using char_type = typename std::iterator_traits<iterator_type>::value_type;
|
|
|
|
using base_adapter_type = iterator_input_adapter<iterator_type>;
|
|
|
|
using adapter_type = wide_string_input_adapter<base_adapter_type, char_type>;
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 14:29:53 +08:00
|
|
|
static adapter_type create(IteratorType first, IteratorType last)
|
|
|
|
{
|
|
|
|
return adapter_type(base_adapter_type(std::move(first), std::move(last)));
|
|
|
|
}
|
|
|
|
};
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
// General purpose iterator-based input
|
|
|
|
template<typename IteratorType>
|
2020-05-28 14:29:53 +08:00
|
|
|
typename iterator_input_adapter_factory<IteratorType>::adapter_type input_adapter(IteratorType first, IteratorType last)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
using factory_type = iterator_input_adapter_factory<IteratorType>;
|
2020-05-28 14:29:53 +08:00
|
|
|
return factory_type::create(first, last);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
// Convenience shorthand from container to iterator
|
2020-12-29 05:20:37 +08:00
|
|
|
// Enables ADL on begin(container) and end(container)
|
|
|
|
// Encloses the using declarations in namespace for not to leak them to outside scope
|
|
|
|
|
2020-12-30 04:36:30 +08:00
|
|
|
namespace container_input_adapter_factory_impl
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
|
|
|
|
2020-12-29 05:20:37 +08:00
|
|
|
using std::begin;
|
|
|
|
using std::end;
|
|
|
|
|
|
|
|
template<typename ContainerType, typename Enable = void>
|
|
|
|
struct container_input_adapter_factory {};
|
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
template<typename ContainerType>
|
2020-12-29 05:20:37 +08:00
|
|
|
struct container_input_adapter_factory< ContainerType,
|
2020-12-30 04:36:30 +08:00
|
|
|
void_t<decltype(begin(std::declval<ContainerType>()), end(std::declval<ContainerType>()))>>
|
|
|
|
{
|
|
|
|
using adapter_type = decltype(input_adapter(begin(std::declval<ContainerType>()), end(std::declval<ContainerType>())));
|
2020-12-29 05:20:37 +08:00
|
|
|
|
2020-12-30 04:36:30 +08:00
|
|
|
static adapter_type create(const ContainerType& container)
|
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
return input_adapter(begin(container), end(container));
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
2020-12-30 04:36:30 +08:00
|
|
|
};
|
2020-12-29 05:20:37 +08:00
|
|
|
|
2021-03-24 14:15:18 +08:00
|
|
|
} // namespace container_input_adapter_factory_impl
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-12-29 05:20:37 +08:00
|
|
|
template<typename ContainerType>
|
|
|
|
typename container_input_adapter_factory_impl::container_input_adapter_factory<ContainerType>::adapter_type input_adapter(const ContainerType& container)
|
|
|
|
{
|
|
|
|
return container_input_adapter_factory_impl::container_input_adapter_factory<ContainerType>::create(container);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
|
|
|
|
2021-04-21 16:24:01 +08:00
|
|
|
#ifndef JSON_NO_IO
|
2020-05-28 00:40:04 +08:00
|
|
|
// Special cases with fast paths
|
|
|
|
inline file_input_adapter input_adapter(std::FILE* file)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
return file_input_adapter(file);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
inline input_stream_adapter input_adapter(std::istream& stream)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
return input_stream_adapter(stream);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
inline input_stream_adapter input_adapter(std::istream&& stream)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
return input_stream_adapter(stream);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
2021-04-21 16:24:01 +08:00
|
|
|
#endif // JSON_NO_IO
|
2020-02-19 23:32:49 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
using contiguous_bytes_input_adapter = decltype(input_adapter(std::declval<const char*>(), std::declval<const char*>()));
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
// Null-delimited strings, and the like.
|
2020-05-28 06:21:38 +08:00
|
|
|
template < typename CharT,
|
|
|
|
typename std::enable_if <
|
2020-06-27 19:16:20 +08:00
|
|
|
std::is_pointer<CharT>::value&&
|
2020-07-11 19:39:14 +08:00
|
|
|
!std::is_array<CharT>::value&&
|
2020-06-27 19:16:20 +08:00
|
|
|
std::is_integral<typename std::remove_pointer<CharT>::type>::value&&
|
2020-05-28 06:21:38 +08:00
|
|
|
sizeof(typename std::remove_pointer<CharT>::type) == 1,
|
|
|
|
int >::type = 0 >
|
2020-05-28 00:40:04 +08:00
|
|
|
contiguous_bytes_input_adapter input_adapter(CharT b)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 00:40:04 +08:00
|
|
|
auto length = std::strlen(reinterpret_cast<const char*>(b));
|
2020-06-23 04:32:21 +08:00
|
|
|
const auto* ptr = reinterpret_cast<const char*>(b);
|
2020-05-28 00:40:04 +08:00
|
|
|
return input_adapter(ptr, ptr + length);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-05-28 06:21:38 +08:00
|
|
|
template<typename T, std::size_t N>
|
2021-03-24 14:15:18 +08:00
|
|
|
auto input_adapter(T (&array)[N]) -> decltype(input_adapter(array, array + N)) // NOLINT(cppcoreguidelines-avoid-c-arrays,hicpp-avoid-c-arrays,modernize-avoid-c-arrays)
|
2020-02-19 23:32:49 +08:00
|
|
|
{
|
2020-05-28 06:21:38 +08:00
|
|
|
return input_adapter(array, array + N);
|
2020-02-19 23:32:49 +08:00
|
|
|
}
|
2018-04-02 01:12:36 +08:00
|
|
|
|
2020-02-19 23:32:49 +08:00
|
|
|
// This class only handles inputs of input_buffer_adapter type.
|
2021-12-29 20:41:01 +08:00
|
|
|
// It's required so that expressions like {ptr, len} can be implicitly cast
|
2020-02-19 23:32:49 +08:00
|
|
|
// to the correct adapter.
|
|
|
|
class span_input_adapter
|
|
|
|
{
|
|
|
|
public:
|
2020-06-03 20:20:36 +08:00
|
|
|
template < typename CharT,
|
|
|
|
typename std::enable_if <
|
|
|
|
std::is_pointer<CharT>::value&&
|
|
|
|
std::is_integral<typename std::remove_pointer<CharT>::type>::value&&
|
|
|
|
sizeof(typename std::remove_pointer<CharT>::type) == 1,
|
|
|
|
int >::type = 0 >
|
2020-02-19 23:32:49 +08:00
|
|
|
span_input_adapter(CharT b, std::size_t l)
|
2020-05-28 00:40:04 +08:00
|
|
|
: ia(reinterpret_cast<const char*>(b), reinterpret_cast<const char*>(b) + l) {}
|
2017-08-14 22:48:55 +08:00
|
|
|
|
|
|
|
template<class IteratorType,
|
|
|
|
typename std::enable_if<
|
2018-11-08 02:39:25 +08:00
|
|
|
std::is_same<typename iterator_traits<IteratorType>::iterator_category, std::random_access_iterator_tag>::value,
|
2017-08-14 22:48:55 +08:00
|
|
|
int>::type = 0>
|
2020-02-19 23:32:49 +08:00
|
|
|
span_input_adapter(IteratorType first, IteratorType last)
|
|
|
|
: ia(input_adapter(first, last)) {}
|
2017-08-14 22:48:55 +08:00
|
|
|
|
2020-05-28 00:40:04 +08:00
|
|
|
contiguous_bytes_input_adapter&& get()
|
2017-08-14 22:48:55 +08:00
|
|
|
{
|
2021-03-24 14:15:18 +08:00
|
|
|
return std::move(ia); // NOLINT(hicpp-move-const-arg,performance-move-const-arg)
|
2017-08-14 22:48:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2020-05-28 00:40:04 +08:00
|
|
|
contiguous_bytes_input_adapter ia;
|
2017-08-14 22:48:55 +08:00
|
|
|
};
|
2018-10-08 00:39:18 +08:00
|
|
|
} // namespace detail
|
|
|
|
} // namespace nlohmann
|