// Copyright 2011-2023 David Robillard // SPDX-License-Identifier: ISC #ifndef SERD_SRC_READER_H #define SERD_SRC_READER_H #include "byte_source.h" #include "node.h" #include "stack.h" #include "serd/attributes.h" #include "serd/error.h" #include "serd/node.h" #include "serd/reader.h" #include "serd/sink.h" #include "serd/statement.h" #include "serd/status.h" #include "serd/syntax.h" #include #include #include #include #ifdef SERD_STACK_CHECK # define SERD_STACK_ASSERT_TOP(reader, ref) \ assert(ref == reader->allocs[reader->n_allocs - 1]); #else # define SERD_STACK_ASSERT_TOP(reader, ref) #endif typedef struct { SerdNode* graph; SerdNode* subject; SerdNode* predicate; SerdNode* object; SerdNode* datatype; SerdNode* lang; SerdStatementFlags* flags; } ReadContext; struct SerdReaderImpl { const SerdSink* sink; SerdErrorFunc error_func; void* error_handle; SerdNode* rdf_first; SerdNode* rdf_rest; SerdNode* rdf_nil; SerdNode* default_graph; SerdByteSource source; SerdStack stack; SerdSyntax syntax; unsigned next_id; uint8_t* buf; char* bprefix; size_t bprefix_len; bool strict; ///< True iff strict parsing bool seen_genid; #ifdef SERD_STACK_CHECK SerdNode** allocs; ///< Stack of push offsets size_t n_allocs; ///< Number of stack pushes #endif }; SERD_LOG_FUNC(3, 4) SerdStatus r_err(SerdReader* reader, SerdStatus st, const char* fmt, ...); SerdNode* push_node_padded(SerdReader* reader, size_t maxlen, SerdNodeType type, const char* str, size_t length); SerdNode* push_node(SerdReader* reader, SerdNodeType type, const char* str, size_t length); SERD_PURE_FUNC size_t genid_size(const SerdReader* reader); SerdNode* blank_id(SerdReader* reader); void set_blank_id(SerdReader* reader, SerdNode* node, size_t buf_size); SerdNode* pop_node(SerdReader* reader, const SerdNode* node); SerdStatus emit_statement(SerdReader* reader, ReadContext ctx, SerdNode* o); SerdStatus read_n3_statement(SerdReader* reader); SerdStatus read_nquads_statement(SerdReader* reader); SerdStatus read_nquadsDoc(SerdReader* reader); SerdStatus read_turtleTrigDoc(SerdReader* reader); static inline int peek_byte(SerdReader* reader) { SerdByteSource* source = &reader->source; return source->eof ? EOF : (int)source->read_buf[source->read_head]; } static inline SerdStatus skip_byte(SerdReader* reader, const int byte) { (void)byte; assert(peek_byte(reader) == byte); return serd_byte_source_advance(&reader->source); } static inline int SERD_NODISCARD eat_byte_safe(SerdReader* reader, const int byte) { (void)byte; assert(peek_byte(reader) == byte); serd_byte_source_advance(&reader->source); return byte; } static inline int SERD_NODISCARD eat_byte_check(SerdReader* reader, const int byte) { const int c = peek_byte(reader); if (c != byte) { r_err(reader, SERD_BAD_SYNTAX, "expected '%c', not '%c'\n", byte, c); return 0; } return eat_byte_safe(reader, byte); } static inline SerdStatus eat_string(SerdReader* reader, const char* str, unsigned n) { for (unsigned i = 0; i < n; ++i) { if (!eat_byte_check(reader, str[i])) { return SERD_BAD_SYNTAX; } } return SERD_SUCCESS; } static inline SerdStatus push_byte(SerdReader* reader, SerdNode* node, const int c) { assert(c != EOF); SERD_STACK_ASSERT_TOP(reader, ref); char* const s = (char*)serd_stack_push(&reader->stack, 1); if (!s) { return SERD_BAD_STACK; } *(s - 1) = (char)c; *s = '\0'; ++node->length; return SERD_SUCCESS; } static inline SerdStatus push_bytes(SerdReader* reader, SerdNode* ref, const uint8_t* bytes, unsigned len) { if (reader->stack.buf_size < reader->stack.size + len) { return SERD_BAD_STACK; } for (unsigned i = 0; i < len; ++i) { push_byte(reader, ref, bytes[i]); } return SERD_SUCCESS; } #endif // SERD_SRC_READER_H