mirror of
https://github.com/RetroDECK/Duckstation.git
synced 2025-01-20 23:35:39 +00:00
707 lines
32 KiB
C++
707 lines
32 KiB
C++
|
#ifndef _C4_YML_PARSE_HPP_
|
||
|
#define _C4_YML_PARSE_HPP_
|
||
|
|
||
|
#ifndef _C4_YML_TREE_HPP_
|
||
|
#include "c4/yml/tree.hpp"
|
||
|
#endif
|
||
|
|
||
|
#ifndef _C4_YML_NODE_HPP_
|
||
|
#include "c4/yml/node.hpp"
|
||
|
#endif
|
||
|
|
||
|
#ifndef _C4_YML_DETAIL_STACK_HPP_
|
||
|
#include "c4/yml/detail/stack.hpp"
|
||
|
#endif
|
||
|
|
||
|
#include <stdarg.h>
|
||
|
|
||
|
#if defined(_MSC_VER)
|
||
|
# pragma warning(push)
|
||
|
# pragma warning(disable: 4251/*needs to have dll-interface to be used by clients of struct*/)
|
||
|
#endif
|
||
|
|
||
|
namespace c4 {
|
||
|
namespace yml {
|
||
|
|
||
|
struct RYML_EXPORT ParserOptions
|
||
|
{
|
||
|
private:
|
||
|
|
||
|
typedef enum : uint32_t {
|
||
|
LOCATIONS = (1 << 0),
|
||
|
DEFAULTS = 0,
|
||
|
} Flags_e;
|
||
|
|
||
|
uint32_t flags = DEFAULTS;
|
||
|
public:
|
||
|
ParserOptions() = default;
|
||
|
|
||
|
/** @name source location tracking */
|
||
|
/** @{ */
|
||
|
|
||
|
/** enable/disable source location tracking */
|
||
|
ParserOptions& locations(bool enabled)
|
||
|
{
|
||
|
if(enabled)
|
||
|
flags |= LOCATIONS;
|
||
|
else
|
||
|
flags &= ~LOCATIONS;
|
||
|
return *this;
|
||
|
}
|
||
|
bool locations() const { return (flags & LOCATIONS) != 0u; }
|
||
|
|
||
|
/** @} */
|
||
|
};
|
||
|
|
||
|
|
||
|
//-----------------------------------------------------------------------------
|
||
|
//-----------------------------------------------------------------------------
|
||
|
//-----------------------------------------------------------------------------
|
||
|
class RYML_EXPORT Parser
|
||
|
{
|
||
|
public:
|
||
|
|
||
|
/** @name construction and assignment */
|
||
|
/** @{ */
|
||
|
|
||
|
Parser(Callbacks const& cb, ParserOptions opts={});
|
||
|
Parser(ParserOptions opts={}) : Parser(get_callbacks(), opts) {}
|
||
|
~Parser();
|
||
|
|
||
|
Parser(Parser &&);
|
||
|
Parser(Parser const&);
|
||
|
Parser& operator=(Parser &&);
|
||
|
Parser& operator=(Parser const&);
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
public:
|
||
|
|
||
|
/** @name modifiers */
|
||
|
/** @{ */
|
||
|
|
||
|
/** Reserve a certain capacity for the parsing stack.
|
||
|
* This should be larger than the expected depth of the parsed
|
||
|
* YAML tree.
|
||
|
*
|
||
|
* The parsing stack is the only (potential) heap memory used by
|
||
|
* the parser.
|
||
|
*
|
||
|
* If the requested capacity is below the default
|
||
|
* stack size of 16, the memory is used directly in the parser
|
||
|
* object; otherwise it will be allocated from the heap.
|
||
|
*
|
||
|
* @note this reserves memory only for the parser itself; all the
|
||
|
* allocations for the parsed tree will go through the tree's
|
||
|
* allocator.
|
||
|
*
|
||
|
* @note the tree and the arena can (and should) also be reserved. */
|
||
|
void reserve_stack(size_t capacity)
|
||
|
{
|
||
|
m_stack.reserve(capacity);
|
||
|
}
|
||
|
|
||
|
/** Reserve a certain capacity for the array used to track node
|
||
|
* locations in the source buffer. */
|
||
|
void reserve_locations(size_t num_source_lines)
|
||
|
{
|
||
|
_resize_locations(num_source_lines);
|
||
|
}
|
||
|
|
||
|
/** Reserve a certain capacity for the character arena used to
|
||
|
* filter scalars. */
|
||
|
void reserve_filter_arena(size_t num_characters)
|
||
|
{
|
||
|
_resize_filter_arena(num_characters);
|
||
|
}
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
public:
|
||
|
|
||
|
/** @name getters and modifiers */
|
||
|
/** @{ */
|
||
|
|
||
|
/** Get the current callbacks in the parser. */
|
||
|
Callbacks callbacks() const { return m_stack.m_callbacks; }
|
||
|
|
||
|
/** Get the name of the latest file parsed by this object. */
|
||
|
csubstr filename() const { return m_file; }
|
||
|
|
||
|
/** Get the latest YAML buffer parsed by this object. */
|
||
|
csubstr source() const { return m_buf; }
|
||
|
|
||
|
size_t stack_capacity() const { return m_stack.capacity(); }
|
||
|
size_t locations_capacity() const { return m_newline_offsets_capacity; }
|
||
|
size_t filter_arena_capacity() const { return m_filter_arena.len; }
|
||
|
|
||
|
ParserOptions const& options() const { return m_options; }
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
public:
|
||
|
|
||
|
/** @name parse_in_place */
|
||
|
/** @{ */
|
||
|
|
||
|
/** Create a new tree and parse into its root.
|
||
|
* The tree is created with the callbacks currently in the parser. */
|
||
|
Tree parse_in_place(csubstr filename, substr src)
{
    // the new tree receives the callbacks currently set in the parser
    Tree tree(callbacks());
    // size the tree from the source-based estimate before parsing
    const size_t estimated = _estimate_capacity(src);
    tree.reserve(estimated);
    // delegate to the workhorse overload, targeting the root node
    parse_in_place(filename, src, &tree, tree.root_id());
    return tree;
}
|
||
|
|
||
|
/** Parse into an existing tree, starting at its root node.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_place(csubstr filename, substr src, Tree *t)
{
    // delegate to the workhorse overload, targeting the root of the given tree
    const size_t root = t->root_id();
    parse_in_place(filename, src, t, root);
}
|
||
|
|
||
|
/** Parse into an existing node.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_place(csubstr filename, substr src, Tree *t, size_t node_id);
|
||
|
// ^^^^^^^^^^^^^ this is the workhorse overload; everything else is syntactic candy
|
||
|
|
||
|
/** Parse into an existing node.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_place(csubstr filename, substr src, NodeRef node)
{
    // unpack the node reference into (tree, id) and delegate to the
    // workhorse overload
    Tree *target = node.tree();
    const size_t target_id = node.id();
    parse_in_place(filename, src, target, target_id);
}
|
||
|
|
||
|
/** Deprecated alias: forwards to parse_in_place(filename, src). */
RYML_DEPRECATED("use parse_in_place() instead") Tree parse(csubstr filename, substr src)
{
    return this->parse_in_place(filename, src);
}

/** Deprecated alias: forwards to parse_in_place(filename, src, t). */
RYML_DEPRECATED("use parse_in_place() instead") void parse(csubstr filename, substr src, Tree *t)
{
    this->parse_in_place(filename, src, t);
}

/** Deprecated alias: forwards to parse_in_place(filename, src, t, node_id). */
RYML_DEPRECATED("use parse_in_place() instead") void parse(csubstr filename, substr src, Tree *t, size_t node_id)
{
    this->parse_in_place(filename, src, t, node_id);
}

/** Deprecated alias: forwards to parse_in_place(filename, src, node). */
RYML_DEPRECATED("use parse_in_place() instead") void parse(csubstr filename, substr src, NodeRef node)
{
    this->parse_in_place(filename, src, node);
}
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
public:
|
||
|
|
||
|
/** @name parse_in_arena: copy the YAML source buffer to the
|
||
|
* tree's arena, then parse the copy in situ
|
||
|
*
|
||
|
* @note overloads receiving a substr YAML buffer are intentionally
|
||
|
* left undefined, such that calling parse_in_arena() with a substr
|
||
|
* will cause a linker error. This is to prevent an accidental
|
||
|
* copy of the source buffer to the tree's arena, because substr
|
||
|
* is implicitly convertible to csubstr. If you really intend to parse
|
||
|
* a mutable buffer in the tree's arena, convert it first to immutable
|
||
|
* by assigning the substr to a csubstr prior to calling parse_in_arena().
|
||
|
* This is not needed for parse_in_place() because csubstr is not
|
||
|
* implicitly convertible to substr. */
|
||
|
/** @{ */
|
||
|
|
||
|
// READ THE NOTE ABOVE!
|
||
|
#define RYML_DONT_PARSE_SUBSTR_IN_ARENA "Do not pass a (mutable) substr to parse_in_arena(); if you have a substr, it should be parsed in place. Consider using parse_in_place() instead, or convert the buffer to csubstr prior to calling. This function is deliberately left undefined and will cause a linker error."
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) Tree parse_in_arena(csubstr filename, substr csrc);
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr csrc, Tree *t);
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr csrc, Tree *t, size_t node_id);
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr csrc, NodeRef node);
|
||
|
|
||
|
/** Create a new tree and parse into its root.
|
||
|
* The immutable YAML source is first copied to the tree's arena,
|
||
|
* and parsed from there.
|
||
|
* The tree is created with the callbacks currently in the parser,
* which are used to allocate the tree members, if any allocation is required. */
|
||
|
Tree parse_in_arena(csubstr filename, csubstr csrc)
{
    // the new tree receives the callbacks currently set in the parser
    Tree tree(callbacks());
    // copy the read-only source into the arena of the new tree;
    // the copy is the buffer that gets parsed
    substr arena_src = tree.copy_to_arena(csrc);
    // size the tree from the source-based estimate before parsing
    const size_t estimated = _estimate_capacity(csrc);
    tree.reserve(estimated);
    parse_in_place(filename, arena_src, &tree, tree.root_id());
    return tree;
}
|
||
|
|
||
|
/** Parse into an existing tree, starting at its root node.
|
||
|
* The immutable YAML source is first copied to the tree's arena,
|
||
|
* and parsed from there.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_arena(csubstr filename, csubstr csrc, Tree *t)
{
    // copy the read-only source into the tree's arena, then parse the
    // copy into the root of that tree
    substr arena_src = t->copy_to_arena(csrc);
    const size_t root = t->root_id();
    parse_in_place(filename, arena_src, t, root);
}
|
||
|
|
||
|
/** Parse into a specific node in an existing tree.
|
||
|
* The immutable YAML source is first copied to the tree's arena,
|
||
|
* and parsed from there.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_arena(csubstr filename, csubstr csrc, Tree *t, size_t node_id)
{
    // copy the read-only source into the tree's arena, then parse the
    // copy into the requested node
    substr arena_src = t->copy_to_arena(csrc);
    parse_in_place(filename, arena_src, t, node_id);
}
|
||
|
|
||
|
/** Parse into a specific node in an existing tree.
|
||
|
* The immutable YAML source is first copied to the tree's arena,
|
||
|
* and parsed from there.
|
||
|
* The callbacks in the tree are kept, and used to allocate
|
||
|
* the tree members, if any allocation is required. */
|
||
|
void parse_in_arena(csubstr filename, csubstr csrc, NodeRef node)
{
    // copy the read-only source into the arena of the node's tree, then
    // parse the copy into that node
    substr arena_src = node.tree()->copy_to_arena(csrc);
    Tree *target = node.tree();
    const size_t target_id = node.id();
    parse_in_place(filename, arena_src, target, target_id);
}
|
||
|
|
||
|
/** Deprecated alias: forwards to parse_in_arena(filename, csrc). */
RYML_DEPRECATED("use parse_in_arena() instead") Tree parse(csubstr filename, csubstr csrc)
{
    return this->parse_in_arena(filename, csrc);
}

/** Deprecated alias: forwards to parse_in_arena(filename, csrc, t). */
RYML_DEPRECATED("use parse_in_arena() instead") void parse(csubstr filename, csubstr csrc, Tree *t)
{
    this->parse_in_arena(filename, csrc, t);
}

/** Deprecated alias: forwards to parse_in_arena(filename, csrc, t, node_id). */
RYML_DEPRECATED("use parse_in_arena() instead") void parse(csubstr filename, csubstr csrc, Tree *t, size_t node_id)
{
    this->parse_in_arena(filename, csrc, t, node_id);
}

/** Deprecated alias: forwards to parse_in_arena(filename, csrc, node). */
RYML_DEPRECATED("use parse_in_arena() instead") void parse(csubstr filename, csubstr csrc, NodeRef node)
{
    this->parse_in_arena(filename, csrc, node);
}
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
public:
|
||
|
|
||
|
/** @name locations */
|
||
|
/** @{ */
|
||
|
|
||
|
/** Get the location of a node of the last tree to be parsed by this parser. */
|
||
|
Location location(Tree const& tree, size_t node_id) const;
|
||
|
/** Get the location of a node of the last tree to be parsed by this parser. */
|
||
|
Location location(ConstNodeRef node) const;
|
||
|
/** Get the string starting at a particular location, to the end
|
||
|
* of the parsed source buffer. */
|
||
|
csubstr location_contents(Location const& loc) const;
|
||
|
/** Given a pointer to a buffer position, get the location. @p val
|
||
|
* must be pointing to somewhere in the source buffer that was
|
||
|
* last parsed by this object. */
|
||
|
Location val_location(const char *val) const;
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
private:
|
||
|
|
||
|
/** The style of a block scalar, as selected by its indicator character. */
typedef enum {
    /** keep newlines (|) */
    BLOCK_LITERAL = 0,
    /** replace newline with single space (>) */
    BLOCK_FOLD = 1
} BlockStyle_e;
|
||
|
|
||
|
/** How the newlines at the end of a block scalar are treated. */
typedef enum {
    /** single newline at end (default) */
    CHOMP_CLIP = 0,
    /** no newline at end (-) */
    CHOMP_STRIP = 1,
    /** all newlines from end (+) */
    CHOMP_KEEP = 2
} BlockChomp_e;
|
||
|
|
||
|
private:
|
||
|
|
||
|
using flag_t = int;
|
||
|
|
||
|
/** Estimate the capacity to reserve in a tree for the given source:
 * the value returned by _count_nlines(), but never less than 16. */
static size_t _estimate_capacity(csubstr src)
{
    const size_t min_capacity = 16;
    const size_t num_lines = _count_nlines(src);
    if(num_lines < min_capacity)
        return min_capacity;
    return num_lines;
}
|
||
|
|
||
|
void _reset();
|
||
|
|
||
|
bool _finished_file() const;
|
||
|
bool _finished_line() const;
|
||
|
|
||
|
csubstr _peek_next_line(size_t pos=npos) const;
|
||
|
bool _advance_to_peeked();
|
||
|
void _scan_line();
|
||
|
|
||
|
csubstr _slurp_doc_scalar();
|
||
|
|
||
|
/**
|
||
|
* @param [out] quoted
|
||
|
* Will only be written to if this method returns true.
|
||
|
* Will be set to true if the scanned scalar was quoted, by '', "", > or |.
|
||
|
*/
|
||
|
bool _scan_scalar_seq_blck(csubstr *C4_RESTRICT scalar, bool *C4_RESTRICT quoted);
|
||
|
bool _scan_scalar_map_blck(csubstr *C4_RESTRICT scalar, bool *C4_RESTRICT quoted);
|
||
|
bool _scan_scalar_seq_flow(csubstr *C4_RESTRICT scalar, bool *C4_RESTRICT quoted);
|
||
|
bool _scan_scalar_map_flow(csubstr *C4_RESTRICT scalar, bool *C4_RESTRICT quoted);
|
||
|
bool _scan_scalar_unk(csubstr *C4_RESTRICT scalar, bool *C4_RESTRICT quoted);
|
||
|
|
||
|
csubstr _scan_comment();
|
||
|
csubstr _scan_squot_scalar();
|
||
|
csubstr _scan_dquot_scalar();
|
||
|
csubstr _scan_block();
|
||
|
substr _scan_plain_scalar_blck(csubstr currscalar, csubstr peeked_line, size_t indentation);
|
||
|
substr _scan_plain_scalar_flow(csubstr currscalar, csubstr peeked_line);
|
||
|
substr _scan_complex_key(csubstr currscalar, csubstr peeked_line);
|
||
|
csubstr _scan_to_next_nonempty_line(size_t indentation);
|
||
|
csubstr _extend_scanned_scalar(csubstr currscalar);
|
||
|
|
||
|
csubstr _filter_squot_scalar(const substr s);
|
||
|
csubstr _filter_dquot_scalar(substr s);
|
||
|
csubstr _filter_plain_scalar(substr s, size_t indentation);
|
||
|
csubstr _filter_block_scalar(substr s, BlockStyle_e style, BlockChomp_e chomp, size_t indentation);
|
||
|
template<bool backslash_is_escape, bool keep_trailing_whitespace>
|
||
|
bool _filter_nl(substr scalar, size_t *C4_RESTRICT pos, size_t *C4_RESTRICT filter_arena_pos, size_t indentation);
|
||
|
template<bool keep_trailing_whitespace>
|
||
|
void _filter_ws(substr scalar, size_t *C4_RESTRICT pos, size_t *C4_RESTRICT filter_arena_pos);
|
||
|
bool _apply_chomp(substr buf, size_t *C4_RESTRICT pos, BlockChomp_e chomp);
|
||
|
|
||
|
void _handle_finished_file();
|
||
|
void _handle_line();
|
||
|
|
||
|
bool _handle_indentation();
|
||
|
|
||
|
bool _handle_unk();
|
||
|
bool _handle_map_flow();
|
||
|
bool _handle_map_blck();
|
||
|
bool _handle_seq_flow();
|
||
|
bool _handle_seq_blck();
|
||
|
bool _handle_top();
|
||
|
bool _handle_types();
|
||
|
bool _handle_key_anchors_and_refs();
|
||
|
bool _handle_val_anchors_and_refs();
|
||
|
void _move_val_tag_to_key_tag();
|
||
|
void _move_key_tag_to_val_tag();
|
||
|
void _move_key_tag2_to_key_tag();
|
||
|
void _move_val_anchor_to_key_anchor();
|
||
|
void _move_key_anchor_to_val_anchor();
|
||
|
|
||
|
void _push_level(bool explicit_flow_chars = false);
|
||
|
void _pop_level();
|
||
|
|
||
|
void _start_unk(bool as_child=true);
|
||
|
|
||
|
void _start_map(bool as_child=true);
|
||
|
void _start_map_unk(bool as_child);
|
||
|
void _stop_map();
|
||
|
|
||
|
void _start_seq(bool as_child=true);
|
||
|
void _stop_seq();
|
||
|
|
||
|
void _start_seqimap();
|
||
|
void _stop_seqimap();
|
||
|
|
||
|
void _start_doc(bool as_child=true);
|
||
|
void _stop_doc();
|
||
|
void _start_new_doc(csubstr rem);
|
||
|
void _end_stream();
|
||
|
|
||
|
NodeData* _append_val(csubstr val, flag_t quoted=false);
|
||
|
NodeData* _append_key_val(csubstr val, flag_t val_quoted=false);
|
||
|
bool _rval_dash_start_or_continue_seq();
|
||
|
|
||
|
void _store_scalar(csubstr s, flag_t is_quoted);
|
||
|
csubstr _consume_scalar();
|
||
|
void _move_scalar_from_top();
|
||
|
|
||
|
inline NodeData* _append_val_null(const char *str) { _RYML_CB_ASSERT(m_stack.m_callbacks, str >= m_buf.begin() && str <= m_buf.end()); return _append_val({nullptr, size_t(0)}); }
|
||
|
inline NodeData* _append_key_val_null(const char *str) { _RYML_CB_ASSERT(m_stack.m_callbacks, str >= m_buf.begin() && str <= m_buf.end()); return _append_key_val({nullptr, size_t(0)}); }
|
||
|
inline void _store_scalar_null(const char *str) { _RYML_CB_ASSERT(m_stack.m_callbacks, str >= m_buf.begin() && str <= m_buf.end()); _store_scalar({nullptr, size_t(0)}, false); }
|
||
|
|
||
|
void _set_indentation(size_t behind);
|
||
|
void _save_indentation(size_t behind=0);
|
||
|
bool _maybe_set_indentation_from_anchor_or_tag();
|
||
|
|
||
|
void _write_key_anchor(size_t node_id);
|
||
|
void _write_val_anchor(size_t node_id);
|
||
|
|
||
|
void _handle_directive(csubstr directive);
|
||
|
|
||
|
void _skipchars(char c);
|
||
|
template<size_t N>
|
||
|
void _skipchars(const char (&chars)[N]);
|
||
|
|
||
|
private:
|
||
|
|
||
|
static size_t _count_nlines(csubstr src);
|
||
|
|
||
|
private:
|
||
|
|
||
|
/** Parser state flags. Every enumerator is a distinct single bit, so
 * that several of them can be combined in one flag_t mask. */
typedef enum : flag_t {
    RTOP     = 0x0001, ///< reading at top level
    RUNK     = 0x0002, ///< reading an unknown: must determine whether scalar, map or seq
    RMAP     = 0x0004, ///< reading a map
    RSEQ     = 0x0008, ///< reading a seq
    FLOW     = 0x0010, ///< reading is inside explicit flow chars: [] or {}
    QMRK     = 0x0020, ///< reading an explicit key (`? key`)
    RKEY     = 0x0040, ///< reading a scalar as key
    RVAL     = 0x0080, ///< reading a scalar as val
    RNXT     = 0x0100, ///< read next val or keyval
    SSCL     = 0x0200, ///< there's a stored scalar
    QSCL     = 0x0400, ///< stored scalar was quoted
    RSET     = 0x0800, ///< the (implicit) map being read is a !!set. @see https://yaml.org/type/set.html
    NDOC     = 0x1000, ///< no document mode. a document has ended and another has not started yet.
    //! reading an implicit map nested in an explicit seq.
    //! eg, {key: [key2: value2, key3: value3]}
    //! is parsed as {key: [{key2: value2}, {key3: value3}]}
    RSEQIMAP = 0x2000,
} State_e;
|
||
|
|
||
|
struct LineContents
|
||
|
{
|
||
|
csubstr full; ///< the full line, including newlines on the right
|
||
|
csubstr stripped; ///< the stripped line, excluding newlines on the right
|
||
|
csubstr rem; ///< the stripped line remainder; initially starts at the first non-space character
|
||
|
size_t indentation; ///< the number of spaces on the beginning of the line
|
||
|
|
||
|
LineContents() : full(), stripped(), rem(), indentation() {}
|
||
|
|
||
|
void reset_with_next_line(csubstr buf, size_t pos);
|
||
|
|
||
|
void reset(csubstr full_, csubstr stripped_)
|
||
|
{
|
||
|
full = full_;
|
||
|
stripped = stripped_;
|
||
|
rem = stripped_;
|
||
|
// find the first column where the character is not a space
|
||
|
indentation = full.first_not_of(' ');
|
||
|
}
|
||
|
|
||
|
size_t current_col() const
|
||
|
{
|
||
|
return current_col(rem);
|
||
|
}
|
||
|
|
||
|
size_t current_col(csubstr s) const
|
||
|
{
|
||
|
RYML_ASSERT(s.str >= full.str);
|
||
|
RYML_ASSERT(full.is_super(s));
|
||
|
size_t col = static_cast<size_t>(s.str - full.str);
|
||
|
return col;
|
||
|
}
|
||
|
};
|
||
|
|
||
|
struct State
|
||
|
{
|
||
|
flag_t flags;
|
||
|
size_t level;
|
||
|
size_t node_id; // don't hold a pointer to the node as it will be relocated during tree resizes
|
||
|
csubstr scalar;
|
||
|
size_t scalar_col; // the column where the scalar (or its quotes) begin
|
||
|
|
||
|
Location pos;
|
||
|
LineContents line_contents;
|
||
|
size_t indref;
|
||
|
|
||
|
State() : flags(), level(), node_id(), scalar(), scalar_col(), pos(), line_contents(), indref() {}
|
||
|
|
||
|
void reset(const char *file, size_t node_id_)
|
||
|
{
|
||
|
flags = RUNK|RTOP;
|
||
|
level = 0;
|
||
|
pos.name = to_csubstr(file);
|
||
|
pos.offset = 0;
|
||
|
pos.line = 1;
|
||
|
pos.col = 1;
|
||
|
node_id = node_id_;
|
||
|
scalar_col = 0;
|
||
|
scalar.clear();
|
||
|
indref = 0;
|
||
|
}
|
||
|
};
|
||
|
|
||
|
void _line_progressed(size_t ahead);
|
||
|
void _line_ended();
|
||
|
void _line_ended_undo();
|
||
|
|
||
|
void _prepare_pop()
|
||
|
{
|
||
|
RYML_ASSERT(m_stack.size() > 1);
|
||
|
State const& curr = m_stack.top();
|
||
|
State & next = m_stack.top(1);
|
||
|
next.pos = curr.pos;
|
||
|
next.line_contents = curr.line_contents;
|
||
|
next.scalar = curr.scalar;
|
||
|
}
|
||
|
|
||
|
inline bool _at_line_begin() const
|
||
|
{
|
||
|
return m_state->line_contents.rem.begin() == m_state->line_contents.full.begin();
|
||
|
}
|
||
|
inline bool _at_line_end() const
|
||
|
{
|
||
|
csubstr r = m_state->line_contents.rem;
|
||
|
return r.empty() || r.begins_with(' ', r.len);
|
||
|
}
|
||
|
/** True when @p token is a sub-string of the full current line. */
inline bool _token_is_from_this_line(csubstr token) const
{
    LineContents const& line = m_state->line_contents;
    return token.is_sub(line.full);
}
|
||
|
|
||
|
/** Get from the tree the data of the node targeted by the state @p s. */
inline NodeData * node(State const* s) const
{
    return m_tree->get(s->node_id);
}

/** Get from the tree the data of the node targeted by the state @p s. */
inline NodeData * node(State const& s) const
{
    return m_tree->get(s.node_id);
}

/** Get from the tree the data of the node with the given id. */
inline NodeData * node(size_t node_id) const
{
    return m_tree->get(node_id);
}
|
||
|
|
||
|
/** True when every bit of @p f is set in the flags of the current state. */
inline bool has_all(flag_t f) const
{
    const flag_t masked = m_state->flags & f;
    return masked == f;
}

/** True when at least one bit of @p f is set in the flags of the current state. */
inline bool has_any(flag_t f) const
{
    const flag_t masked = m_state->flags & f;
    return masked != 0;
}

/** True when no bit of @p f is set in the flags of the current state. */
inline bool has_none(flag_t f) const
{
    const flag_t masked = m_state->flags & f;
    return masked == 0;
}
|
||
|
|
||
|
/** True when every bit of @p f is set in the flags of the state @p s. */
static inline bool has_all(flag_t f, State const* s)
{
    const flag_t masked = s->flags & f;
    return masked == f;
}

/** True when at least one bit of @p f is set in the flags of the state @p s. */
static inline bool has_any(flag_t f, State const* s)
{
    const flag_t masked = s->flags & f;
    return masked != 0;
}

/** True when no bit of @p f is set in the flags of the state @p s. */
static inline bool has_none(flag_t f, State const* s)
{
    const flag_t masked = s->flags & f;
    return masked == 0;
}
|
||
|
|
||
|
inline void set_flags(flag_t f) { set_flags(f, m_state); }
|
||
|
inline void add_flags(flag_t on) { add_flags(on, m_state); }
|
||
|
inline void addrem_flags(flag_t on, flag_t off) { addrem_flags(on, off, m_state); }
|
||
|
inline void rem_flags(flag_t off) { rem_flags(off, m_state); }
|
||
|
|
||
|
void set_flags(flag_t f, State * s);
|
||
|
void add_flags(flag_t on, State * s);
|
||
|
void addrem_flags(flag_t on, flag_t off, State * s);
|
||
|
void rem_flags(flag_t off, State * s);
|
||
|
|
||
|
void _resize_filter_arena(size_t num_characters);
|
||
|
void _grow_filter_arena(size_t num_characters);
|
||
|
substr _finish_filter_arena(substr dst, size_t pos);
|
||
|
|
||
|
void _prepare_locations();
|
||
|
void _resize_locations(size_t sz);
|
||
|
bool _locations_dirty() const;
|
||
|
|
||
|
bool _location_from_cont(Tree const& tree, size_t node, Location *C4_RESTRICT loc) const;
|
||
|
bool _location_from_node(Tree const& tree, size_t node, Location *C4_RESTRICT loc, size_t level) const;
|
||
|
|
||
|
private:
|
||
|
|
||
|
void _free();
|
||
|
void _clr();
|
||
|
void _cp(Parser const* that);
|
||
|
void _mv(Parser *that);
|
||
|
|
||
|
#ifdef RYML_DBG
|
||
|
template<class ...Args> void _dbg(csubstr fmt, Args const& C4_RESTRICT ...args) const;
|
||
|
#endif
|
||
|
template<class ...Args> void _err(csubstr fmt, Args const& C4_RESTRICT ...args) const;
|
||
|
template<class DumpFn> void _fmt_msg(DumpFn &&dumpfn) const;
|
||
|
static csubstr _prfl(substr buf, flag_t v);
|
||
|
|
||
|
private:
|
||
|
|
||
|
ParserOptions m_options;
|
||
|
|
||
|
csubstr m_file;
|
||
|
substr m_buf;
|
||
|
|
||
|
size_t m_root_id;
|
||
|
Tree * m_tree;
|
||
|
|
||
|
detail::stack<State> m_stack;
|
||
|
State * m_state;
|
||
|
|
||
|
size_t m_key_tag_indentation;
|
||
|
size_t m_key_tag2_indentation;
|
||
|
csubstr m_key_tag;
|
||
|
csubstr m_key_tag2;
|
||
|
size_t m_val_tag_indentation;
|
||
|
csubstr m_val_tag;
|
||
|
|
||
|
bool m_key_anchor_was_before;
|
||
|
size_t m_key_anchor_indentation;
|
||
|
csubstr m_key_anchor;
|
||
|
size_t m_val_anchor_indentation;
|
||
|
csubstr m_val_anchor;
|
||
|
|
||
|
substr m_filter_arena;
|
||
|
|
||
|
size_t *m_newline_offsets;
|
||
|
size_t m_newline_offsets_size;
|
||
|
size_t m_newline_offsets_capacity;
|
||
|
csubstr m_newline_offsets_buf;
|
||
|
};
|
||
|
|
||
|
|
||
|
//-----------------------------------------------------------------------------
|
||
|
//-----------------------------------------------------------------------------
|
||
|
//-----------------------------------------------------------------------------
|
||
|
|
||
|
/** @name parse_in_place
|
||
|
*
|
||
|
* @desc parse a mutable YAML source buffer.
|
||
|
*
|
||
|
* @note These freestanding functions use a temporary parser object,
|
||
|
* and are convenience functions to easily parse YAML without the need
|
||
|
* to instantiate a separate parser. Note that some properties
|
||
|
* (notably node locations in the original source code) are only
|
||
|
* available through the parser object after it has parsed the
|
||
|
* code. If you need access to any of these properties, use
|
||
|
* Parser::parse_in_place() */
|
||
|
/** @{ */
|
||
|
|
||
|
inline Tree parse_in_place( substr yaml ) { Parser np; return np.parse_in_place({} , yaml); } //!< parse in-situ a modifiable YAML source buffer.
|
||
|
inline Tree parse_in_place(csubstr filename, substr yaml ) { Parser np; return np.parse_in_place(filename, yaml); } //!< parse in-situ a modifiable YAML source buffer, providing a filename for error messages.
|
||
|
inline void parse_in_place( substr yaml, Tree *t ) { Parser np; np.parse_in_place({} , yaml, t); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer
|
||
|
inline void parse_in_place(csubstr filename, substr yaml, Tree *t ) { Parser np; np.parse_in_place(filename, yaml, t); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer, providing a filename for error messages.
|
||
|
inline void parse_in_place( substr yaml, Tree *t, size_t node_id) { Parser np; np.parse_in_place({} , yaml, t, node_id); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer
|
||
|
inline void parse_in_place(csubstr filename, substr yaml, Tree *t, size_t node_id) { Parser np; np.parse_in_place(filename, yaml, t, node_id); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer, providing a filename for error messages.
|
||
|
inline void parse_in_place( substr yaml, NodeRef node ) { Parser np; np.parse_in_place({} , yaml, node); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer
|
||
|
inline void parse_in_place(csubstr filename, substr yaml, NodeRef node ) { Parser np; np.parse_in_place(filename, yaml, node); } //!< reusing the YAML tree, parse in-situ a modifiable YAML source buffer, providing a filename for error messages.
|
||
|
|
||
|
/** Deprecated: parse in-situ a modifiable YAML source buffer with a temporary parser. */
RYML_DEPRECATED("use parse_in_place() instead") inline Tree parse(substr yaml)
{
    Parser parser;
    return parser.parse_in_place({}, yaml);
}

/** Deprecated: as above, providing a filename. */
RYML_DEPRECATED("use parse_in_place() instead") inline Tree parse(csubstr filename, substr yaml)
{
    Parser parser;
    return parser.parse_in_place(filename, yaml);
}

/** Deprecated: parse in-situ into the given tree with a temporary parser. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(substr yaml, Tree *t)
{
    Parser parser;
    parser.parse_in_place({}, yaml, t);
}

/** Deprecated: as above, providing a filename. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(csubstr filename, substr yaml, Tree *t)
{
    Parser parser;
    parser.parse_in_place(filename, yaml, t);
}

/** Deprecated: parse in-situ into the given node of the tree with a temporary parser. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(substr yaml, Tree *t, size_t node_id)
{
    Parser parser;
    parser.parse_in_place({}, yaml, t, node_id);
}

/** Deprecated: as above, providing a filename. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(csubstr filename, substr yaml, Tree *t, size_t node_id)
{
    Parser parser;
    parser.parse_in_place(filename, yaml, t, node_id);
}

/** Deprecated: parse in-situ into the given node reference with a temporary parser. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(substr yaml, NodeRef node)
{
    Parser parser;
    parser.parse_in_place({}, yaml, node);
}

/** Deprecated: as above, providing a filename. */
RYML_DEPRECATED("use parse_in_place() instead") inline void parse(csubstr filename, substr yaml, NodeRef node)
{
    Parser parser;
    parser.parse_in_place(filename, yaml, node);
}
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
|
||
|
//-----------------------------------------------------------------------------
|
||
|
|
||
|
/** @name parse_in_arena
|
||
|
* @desc parse a read-only YAML source buffer, copying it first to the tree's arena.
|
||
|
*
|
||
|
* @note These freestanding functions use a temporary parser object,
|
||
|
* and are convenience functions to easily parse YAML without the need
|
||
|
* to instantiate a separate parser. Note that some properties
|
||
|
* (notably node locations in the original source code) are only
|
||
|
* available through the parser object after it has parsed the
|
||
|
* code. If you need access to any of these properties, use
|
||
|
* Parser::parse_in_arena().
|
||
|
*
|
||
|
* @note overloads receiving a substr YAML buffer are intentionally
|
||
|
* left undefined, such that calling parse_in_arena() with a substr
|
||
|
* will cause a linker error. This is to prevent an accidental
|
||
|
* copy of the source buffer to the tree's arena, because substr
|
||
|
* is implicitly convertible to csubstr. If you really intend to parse
|
||
|
* a mutable buffer in the tree's arena, convert it first to immutable
|
||
|
* by assigning the substr to a csubstr prior to calling parse_in_arena().
|
||
|
* This is not needed for parse_in_place() because csubstr is not
|
||
|
* implicitly convertible to substr. */
|
||
|
/** @{ */
|
||
|
|
||
|
/* READ THE NOTE ABOVE! */
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) Tree parse_in_arena( substr yaml );
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) Tree parse_in_arena(csubstr filename, substr yaml );
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena( substr yaml, Tree *t );
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr yaml, Tree *t );
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena( substr yaml, Tree *t, size_t node_id);
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr yaml, Tree *t, size_t node_id);
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena( substr yaml, NodeRef node );
|
||
|
RYML_DEPRECATED(RYML_DONT_PARSE_SUBSTR_IN_ARENA) void parse_in_arena(csubstr filename, substr yaml, NodeRef node );
|
||
|
|
||
|
inline Tree parse_in_arena( csubstr yaml ) { Parser np; return np.parse_in_arena({} , yaml); } //!< parse a read-only YAML source buffer, copying it first to the tree's source arena.
|
||
|
inline Tree parse_in_arena(csubstr filename, csubstr yaml ) { Parser np; return np.parse_in_arena(filename, yaml); } //!< parse a read-only YAML source buffer, copying it first to the tree's source arena, providing a filename for error messages.
|
||
|
inline void parse_in_arena( csubstr yaml, Tree *t ) { Parser np; np.parse_in_arena({} , yaml, t); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena.
|
||
|
inline void parse_in_arena(csubstr filename, csubstr yaml, Tree *t ) { Parser np; np.parse_in_arena(filename, yaml, t); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena, providing a filename for error messages.
|
||
|
inline void parse_in_arena( csubstr yaml, Tree *t, size_t node_id) { Parser np; np.parse_in_arena({} , yaml, t, node_id); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena.
|
||
|
inline void parse_in_arena(csubstr filename, csubstr yaml, Tree *t, size_t node_id) { Parser np; np.parse_in_arena(filename, yaml, t, node_id); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena, providing a filename for error messages.
|
||
|
inline void parse_in_arena( csubstr yaml, NodeRef node ) { Parser np; np.parse_in_arena({} , yaml, node); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena.
|
||
|
inline void parse_in_arena(csubstr filename, csubstr yaml, NodeRef node ) { Parser np; np.parse_in_arena(filename, yaml, node); } //!< reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena, providing a filename for error messages.
|
||
|
|
||
|
/** Deprecated: parse a read-only YAML source buffer, copying it first to the tree's source arena. */
RYML_DEPRECATED("use parse_in_arena() instead") inline Tree parse(csubstr yaml)
{
    Parser parser;
    return parser.parse_in_arena({}, yaml);
}

/** Deprecated: as above, providing a filename for error messages. */
RYML_DEPRECATED("use parse_in_arena() instead") inline Tree parse(csubstr filename, csubstr yaml)
{
    Parser parser;
    return parser.parse_in_arena(filename, yaml);
}

/** Deprecated: reusing the YAML tree, parse a read-only YAML source buffer, copying it first to the tree's source arena. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr yaml, Tree *t)
{
    Parser parser;
    parser.parse_in_arena({}, yaml, t);
}

/** Deprecated: as above, providing a filename for error messages. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr filename, csubstr yaml, Tree *t)
{
    Parser parser;
    parser.parse_in_arena(filename, yaml, t);
}

/** Deprecated: reusing the YAML tree, parse a read-only YAML source buffer into the given node, copying it first to the tree's source arena. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr yaml, Tree *t, size_t node_id)
{
    Parser parser;
    parser.parse_in_arena({}, yaml, t, node_id);
}

/** Deprecated: as above, providing a filename for error messages. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr filename, csubstr yaml, Tree *t, size_t node_id)
{
    Parser parser;
    parser.parse_in_arena(filename, yaml, t, node_id);
}

/** Deprecated: reusing the YAML tree, parse a read-only YAML source buffer into the given node reference, copying it first to the tree's source arena. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr yaml, NodeRef node)
{
    Parser parser;
    parser.parse_in_arena({}, yaml, node);
}

/** Deprecated: as above, providing a filename for error messages. */
RYML_DEPRECATED("use parse_in_arena() instead") inline void parse(csubstr filename, csubstr yaml, NodeRef node)
{
    Parser parser;
    parser.parse_in_arena(filename, yaml, node);
}
|
||
|
|
||
|
/** @} */
|
||
|
|
||
|
} // namespace yml
|
||
|
} // namespace c4
|
||
|
|
||
|
#if defined(_MSC_VER)
|
||
|
# pragma warning(pop)
|
||
|
#endif
|
||
|
|
||
|
#endif /* _C4_YML_PARSE_HPP_ */
|