1#ifndef SIMDJSON_PARSER_INL_H
2#define SIMDJSON_PARSER_INL_H
4#include "simdjson/dom/base.h"
5#include "simdjson/dom/document_stream.h"
6#include "simdjson/implementation.h"
7#include "simdjson/internal/dom_parser_implementation.h"
9#include "simdjson/error-inl.h"
10#include "simdjson/padded_string-inl.h"
11#include "simdjson/dom/document_stream-inl.h"
12#include "simdjson/dom/element-inl.h"
24 : _max_capacity{max_capacity},
25 loaded_bytes(
nullptr) {
30inline bool parser::is_valid() const noexcept {
return valid; }
31inline int parser::get_error_code() const noexcept {
return error; }
32inline std::string parser::get_error_message() const noexcept {
return error_message(error); }
34inline bool parser::dump_raw_tape(std::ostream &os)
const noexcept {
35 return valid ? doc.dump_raw_tape(os) :
false;
38inline simdjson_result<size_t> parser::read_file(std::string_view path)
noexcept {
39 const std::string path_copy(path);
41 SIMDJSON_PUSH_DISABLE_WARNINGS
42 SIMDJSON_DISABLE_DEPRECATED_WARNING
43 std::FILE *fp = std::fopen(path_copy.c_str(),
"rb");
44 SIMDJSON_POP_DISABLE_WARNINGS
52#if SIMDJSON_VISUAL_STUDIO && !SIMDJSON_IS_32BITS
53 ret = _fseeki64(fp, 0, SEEK_END);
55 ret = std::fseek(fp, 0, SEEK_END);
61#if SIMDJSON_VISUAL_STUDIO && !SIMDJSON_IS_32BITS
62 __int64 len = _ftelli64(fp);
68 long len = std::ftell(fp);
69 if((len < 0) || (len == LONG_MAX)) {
76 if (_loaded_bytes_capacity <
size_t(len)) {
77 loaded_bytes.reset( internal::allocate_padded_buffer(len) );
82 _loaded_bytes_capacity = len;
87 size_t bytes_read = std::fread(loaded_bytes.get(), 1, len, fp);
88 if (std::fclose(fp) != 0 || bytes_read !=
size_t(len)) {
96 return load_into_document(doc, path);
101 auto _error = read_file(path).
get(len);
102 if (_error) {
return _error; }
103 return parse_into_document(provided_doc, loaded_bytes.get(), len,
false);
108 auto _error = read_file(path).
get(len);
109 if (_error) {
return _error; }
110 if(batch_size < MINIMAL_BATCH_SIZE) { batch_size = MINIMAL_BATCH_SIZE; }
111 return document_stream(*
this,
reinterpret_cast<const uint8_t*
>(loaded_bytes.get()), len, batch_size);
117 error_code _error = ensure_capacity(provided_doc, len);
118 if (_error) {
return _error; }
119 if (realloc_if_needed) {
121 if (!loaded_bytes || _loaded_bytes_capacity < len) {
122 loaded_bytes.reset( internal::allocate_padded_buffer(len) );
126 _loaded_bytes_capacity = len;
128 std::memcpy(
static_cast<void *
>(loaded_bytes.get()), buf, len);
129 buf =
reinterpret_cast<const uint8_t*
>(loaded_bytes.get());
132 if((len >= 3) && (std::memcmp(buf,
"\xEF\xBB\xBF", 3) == 0)) {
139 if (_error) {
return _error; }
141 return provided_doc.root();
145 return parse_into_document(provided_doc,
reinterpret_cast<const uint8_t *
>(buf), len, realloc_if_needed);
148 return parse_into_document(provided_doc, s.data(), s.length(), s.capacity() - s.length() <
SIMDJSON_PADDING);
151 return parse_into_document(provided_doc, s.data(), s.length(),
false);
156 return parse_into_document(doc, buf, len, realloc_if_needed);
160 return parse(
reinterpret_cast<const uint8_t *
>(buf), len, realloc_if_needed);
163 return parse(s.data(), s.length(), s.capacity() - s.length() <
SIMDJSON_PADDING);
165simdjson_inline simdjson_result<element>
parser::parse(
const padded_string &s) &
noexcept {
166 return parse(s.data(), s.length(),
false);
168simdjson_inline simdjson_result<element>
parser::parse(
const padded_string_view &v) &
noexcept {
169 return parse(v.data(), v.length(),
false);
173 if(batch_size < MINIMAL_BATCH_SIZE) { batch_size = MINIMAL_BATCH_SIZE; }
174 if((len >= 3) && (std::memcmp(buf,
"\xEF\xBB\xBF", 3) == 0)) {
181 return parse_many(
reinterpret_cast<const uint8_t *
>(buf), len, batch_size);
184 return parse_many(s.data(), s.length(), batch_size);
186inline simdjson_result<document_stream>
parser::parse_many(
const padded_string &s,
size_t batch_size)
noexcept {
187 return parse_many(s.data(), s.length(), batch_size);
194 return _max_capacity;
211 if (err) {
return err; }
215#ifndef SIMDJSON_DISABLE_DEPRECATED_API
217inline bool parser::allocate_capacity(
size_t capacity,
size_t max_depth)
noexcept {
218 return !allocate(capacity, max_depth);
222inline error_code parser::ensure_capacity(
size_t desired_capacity)
noexcept {
223 return ensure_capacity(doc, desired_capacity);
227inline error_code parser::ensure_capacity(document& target_document,
size_t desired_capacity)
noexcept {
230 if(desired_capacity < MINIMAL_DOCUMENT_CAPACITY) { desired_capacity = MINIMAL_DOCUMENT_CAPACITY; }
237 if (simdjson_unlikely(capacity() < desired_capacity || target_document.capacity() < desired_capacity)) {
238 if (desired_capacity > max_capacity()) {
241 error_code err1 = target_document.capacity() < desired_capacity ? target_document.allocate(desired_capacity) :
SUCCESS;
242 error_code err2 = capacity() < desired_capacity ? allocate(desired_capacity, max_depth()) :
SUCCESS;
243 if(err1 !=
SUCCESS) {
return error = err1; }
244 if(err2 !=
SUCCESS) {
return error = err2; }
250 if(max_capacity > MINIMAL_DOCUMENT_CAPACITY) {
251 _max_capacity = max_capacity;
253 _max_capacity = MINIMAL_DOCUMENT_CAPACITY;
A forward-only stream of documents.
simdjson_inline parser(size_t max_capacity=SIMDJSON_MAXSIZE_BYTES) noexcept
Create a JSON parser.
simdjson_result< element > parse(const uint8_t *buf, size_t len, bool realloc_if_needed=true) &noexcept
Parse a JSON document and return a temporary reference to it.
simdjson_result< element > parse_into_document(document &doc, const uint8_t *buf, size_t len, bool realloc_if_needed=true) &noexcept
Parse a JSON document into a provide document instance and return a temporary reference to it.
simdjson_result< document_stream > parse_many(const uint8_t *buf, size_t len, size_t batch_size=dom::DEFAULT_BATCH_SIZE) noexcept
Parse a buffer containing many JSON documents.
simdjson_inline void set_max_capacity(size_t max_capacity) noexcept
Set max_capacity.
simdjson_inline size_t max_capacity() const noexcept
The largest document this parser can automatically support.
simdjson_result< document_stream > load_many(std::string_view path, size_t batch_size=dom::DEFAULT_BATCH_SIZE) noexcept
Load a file containing many JSON documents.
simdjson_result< element > load_into_document(document &doc, std::string_view path) &noexcept
Load a JSON document from a file into a provide document instance and return a temporary reference to...
simdjson_pure simdjson_inline size_t max_depth() const noexcept
The maximum level of nested object and arrays supported by this parser.
simdjson_result< element > load(std::string_view path) &noexcept
Load a JSON document from a file and return a reference to it.
simdjson_inline size_t capacity() const noexcept
The largest document this parser can support without reallocating.
simdjson_inline parser & operator=(parser &&other) noexcept
Take another parser's buffers and state.
simdjson_warn_unused error_code allocate(size_t capacity, size_t max_depth=DEFAULT_MAX_DEPTH) noexcept
Ensure this parser has enough memory to process JSON documents up to capacity bytes in length and max...
An implementation of simdjson for a particular CPU architecture.
The top level simdjson namespace, containing everything the library provides.
SIMDJSON_DLLIMPORTEXPORT internal::atomic_ptr< const implementation > & get_active_implementation()
The active implementation.
const char * error_message(error_code error) noexcept
It is the convention throughout the code that the macro SIMDJSON_DEVELOPMENT_CHECKS determines whethe...
constexpr size_t DEFAULT_MAX_DEPTH
By default, simdjson supports this many nested objects and arrays.
error_code
All possible errors returned by simdjson.
@ CAPACITY
This parser can't support a document that big.
@ MEMALLOC
Error allocating memory, most likely out of memory.
@ IO_ERROR
Error reading a file.
constexpr size_t SIMDJSON_PADDING
The amount of padding needed in a buffer to parse JSON.
The result of a simdjson operation that could fail.
simdjson_warn_unused simdjson_inline error_code get(T &value) &&noexcept
Move the value to the provided variable.