1 #ifndef SIMDJSON_PARSER_INL_H
2 #define SIMDJSON_PARSER_INL_H
4 #include "simdjson/dom/base.h"
5 #include "simdjson/dom/document_stream.h"
6 #include "simdjson/implementation.h"
7 #include "simdjson/internal/dom_parser_implementation.h"
9 #include "simdjson/error-inl.h"
10 #include "simdjson/padded_string-inl.h"
11 #include "simdjson/dom/document_stream-inl.h"
12 #include "simdjson/dom/element-inl.h"
24 : _max_capacity{max_capacity},
25 loaded_bytes(
nullptr) {
30 inline bool parser::is_valid() const noexcept {
return valid; }
31 inline int parser::get_error_code() const noexcept {
return error; }
32 inline std::string parser::get_error_message() const noexcept {
return error_message(error); }
34 inline bool parser::dump_raw_tape(std::ostream &os)
const noexcept {
35 return valid ? doc.dump_raw_tape(os) :
false;
38 inline simdjson_result<size_t> parser::read_file(
const std::string &path) noexcept {
40 SIMDJSON_PUSH_DISABLE_WARNINGS
41 SIMDJSON_DISABLE_DEPRECATED_WARNING
42 std::FILE *fp = std::fopen(path.c_str(),
"rb");
43 SIMDJSON_POP_DISABLE_WARNINGS
51 #if SIMDJSON_VISUAL_STUDIO && !SIMDJSON_IS_32BITS
52 ret = _fseeki64(fp, 0, SEEK_END);
54 ret = std::fseek(fp, 0, SEEK_END);
60 #if SIMDJSON_VISUAL_STUDIO && !SIMDJSON_IS_32BITS
61 __int64 len = _ftelli64(fp);
67 long len = std::ftell(fp);
68 if((len < 0) || (len == LONG_MAX)) {
75 if (_loaded_bytes_capacity <
size_t(len)) {
76 loaded_bytes.reset( internal::allocate_padded_buffer(len) );
81 _loaded_bytes_capacity = len;
86 size_t bytes_read = std::fread(loaded_bytes.get(), 1, len, fp);
87 if (std::fclose(fp) != 0 || bytes_read !=
size_t(len)) {
95 return load_into_document(doc, path);
100 auto _error = read_file(path).get(len);
101 if (_error) {
return _error; }
102 return parse_into_document(provided_doc, loaded_bytes.get(), len,
false);
107 auto _error = read_file(path).get(len);
108 if (_error) {
return _error; }
109 if(batch_size < MINIMAL_BATCH_SIZE) { batch_size = MINIMAL_BATCH_SIZE; }
110 return document_stream(*
this,
reinterpret_cast<const uint8_t*
>(loaded_bytes.get()), len, batch_size);
116 error_code _error = ensure_capacity(provided_doc, len);
117 if (_error) {
return _error; }
118 if (realloc_if_needed) {
120 if (!loaded_bytes || _loaded_bytes_capacity < len) {
121 loaded_bytes.reset( internal::allocate_padded_buffer(len) );
125 _loaded_bytes_capacity = len;
127 std::memcpy(
static_cast<void *
>(loaded_bytes.get()), buf, len);
128 buf =
reinterpret_cast<const uint8_t*
>(loaded_bytes.get());
131 if((len >= 3) && (std::memcmp(buf,
"\xEF\xBB\xBF", 3) == 0)) {
137 if (_error) {
return _error; }
139 return provided_doc.root();
143 return parse_into_document(provided_doc,
reinterpret_cast<const uint8_t *
>(buf), len, realloc_if_needed);
146 return parse_into_document(provided_doc, s.data(), s.length(), s.capacity() - s.length() <
SIMDJSON_PADDING);
149 return parse_into_document(provided_doc, s.data(), s.length(),
false);
154 return parse_into_document(doc, buf, len, realloc_if_needed);
158 return parse(
reinterpret_cast<const uint8_t *
>(buf), len, realloc_if_needed);
161 return parse(s.data(), s.length(), s.capacity() - s.length() <
SIMDJSON_PADDING);
163 simdjson_inline simdjson_result<element>
parser::parse(
const padded_string &s) & noexcept {
164 return parse(s.data(), s.length(),
false);
166 simdjson_inline simdjson_result<element>
parser::parse(
const padded_string_view &v) & noexcept {
167 return parse(v.data(), v.length(),
false);
171 if(batch_size < MINIMAL_BATCH_SIZE) { batch_size = MINIMAL_BATCH_SIZE; }
172 if((len >= 3) && (std::memcmp(buf,
"\xEF\xBB\xBF", 3) == 0)) {
179 return parse_many(
reinterpret_cast<const uint8_t *
>(buf), len, batch_size);
182 return parse_many(s.data(), s.length(), batch_size);
184 inline simdjson_result<document_stream>
parser::parse_many(
const padded_string &s,
size_t batch_size) noexcept {
185 return parse_many(s.data(), s.length(), batch_size);
192 return _max_capacity;
209 if (err) {
return err; }
213 #ifndef SIMDJSON_DISABLE_DEPRECATED_API
215 inline bool parser::allocate_capacity(
size_t capacity,
size_t max_depth) noexcept {
216 return !allocate(capacity, max_depth);
220 inline error_code parser::ensure_capacity(
size_t desired_capacity) noexcept {
221 return ensure_capacity(doc, desired_capacity);
225 inline error_code parser::ensure_capacity(document& target_document,
size_t desired_capacity) noexcept {
228 if(desired_capacity < MINIMAL_DOCUMENT_CAPACITY) { desired_capacity = MINIMAL_DOCUMENT_CAPACITY; }
235 if (simdjson_unlikely(capacity() < desired_capacity || target_document.capacity() < desired_capacity)) {
236 if (desired_capacity > max_capacity()) {
239 error_code err1 = target_document.capacity() < desired_capacity ? target_document.allocate(desired_capacity) :
SUCCESS;
240 error_code err2 = capacity() < desired_capacity ? allocate(desired_capacity, max_depth()) :
SUCCESS;
241 if(err1 !=
SUCCESS) {
return error = err1; }
242 if(err2 !=
SUCCESS) {
return error = err2; }
248 if(max_capacity > MINIMAL_DOCUMENT_CAPACITY) {
249 _max_capacity = max_capacity;
251 _max_capacity = MINIMAL_DOCUMENT_CAPACITY;
A forward-only stream of documents.
simdjson_inline parser(size_t max_capacity=SIMDJSON_MAXSIZE_BYTES) noexcept
Create a JSON parser.
simdjson_result< element > parse(const uint8_t *buf, size_t len, bool realloc_if_needed=true) &noexcept
Parse a JSON document and return a temporary reference to it.
simdjson_result< element > parse_into_document(document &doc, const uint8_t *buf, size_t len, bool realloc_if_needed=true) &noexcept
Parse a JSON document into a provide document instance and return a temporary reference to it.
simdjson_result< document_stream > load_many(const std::string &path, size_t batch_size=dom::DEFAULT_BATCH_SIZE) noexcept
Load a file containing many JSON documents.
simdjson_inline void set_max_capacity(size_t max_capacity) noexcept
Set max_capacity.
simdjson_inline size_t max_capacity() const noexcept
The largest document this parser can automatically support.
simdjson_pure simdjson_inline size_t max_depth() const noexcept
The maximum level of nested object and arrays supported by this parser.
simdjson_result< element > load(const std::string &path) &noexcept
Load a JSON document from a file and return a reference to it.
simdjson_result< element > load_into_document(document &doc, const std::string &path) &noexcept
Load a JSON document from a file into a provide document instance and return a temporary reference to...
simdjson_inline size_t capacity() const noexcept
The largest document this parser can support without reallocating.
simdjson_inline parser & operator=(parser &&other) noexcept
Take another parser's buffers and state.
simdjson_warn_unused error_code allocate(size_t capacity, size_t max_depth=DEFAULT_MAX_DEPTH) noexcept
Ensure this parser has enough memory to process JSON documents up to capacity bytes in length and max...
simdjson_result< document_stream > parse_many(const uint8_t *buf, size_t len, size_t batch_size=dom::DEFAULT_BATCH_SIZE) noexcept
Parse a buffer containing many JSON documents.
An implementation of simdjson for a particular CPU architecture.
The top level simdjson namespace, containing everything the library provides.
const char * error_message(error_code error) noexcept
It is the convention throughout the code that the macro SIMDJSON_DEVELOPMENT_CHECKS determines whethe...
constexpr size_t DEFAULT_MAX_DEPTH
By default, simdjson supports this many nested objects and arrays.
error_code
All possible errors returned by simdjson.
@ CAPACITY
This parser can't support a document that big.
@ MEMALLOC
Error allocating memory, most likely out of memory.
@ IO_ERROR
Error reading a file.
SIMDJSON_DLLIMPORTEXPORT internal::atomic_ptr< const implementation > & get_active_implementation()
The active implementation.
constexpr size_t SIMDJSON_PADDING
The amount of padding needed in a buffer to parse JSON.
The result of a simdjson operation that could fail.