diff options
author | David Robillard <d@drobilla.net> | 2023-09-10 13:39:56 -0400 |
---|---|---|
committer | David Robillard <d@drobilla.net> | 2023-12-02 18:49:07 -0500 |
commit | d80b2a1c153f81685d026f8e09c12175abed3d03 (patch) | |
tree | 8207788e58ee9de94ca224433a02a88e8fed3801 | |
parent | 76fabe903adb09e6fe4d084ff6be49115285e086 (diff) | |
download | serd-d80b2a1c153f81685d026f8e09c12175abed3d03.tar.gz serd-d80b2a1c153f81685d026f8e09c12175abed3d03.tar.bz2 serd-d80b2a1c153f81685d026f8e09c12175abed3d03.zip |
Separate Turtle and TriG reading code
-rw-r--r-- | include/serd/world.h | 2 | ||||
-rw-r--r-- | meson.build | 3 | ||||
-rw-r--r-- | src/read_trig.c | 203 | ||||
-rw-r--r-- | src/read_trig.h | 24 | ||||
-rw-r--r-- | src/read_turtle.c (renamed from src/n3.c) | 190 | ||||
-rw-r--r-- | src/read_turtle.h | 89 | ||||
-rw-r--r-- | src/reader.c | 35 | ||||
-rw-r--r-- | src/reader.h | 9 | ||||
-rw-r--r-- | test/test_syntax.c | 3 |
9 files changed, 405 insertions, 153 deletions
diff --git a/include/serd/world.h b/include/serd/world.h index 4c51df73..86e43bb1 100644 --- a/include/serd/world.h +++ b/include/serd/world.h @@ -51,7 +51,7 @@ serd_world_free(SerdWorld* ZIX_NULLABLE world); a megabyte and over 100 levels of nesting, which is more than enough for most data. */ -SERD_API SerdLimits +SERD_PURE_API SerdLimits serd_world_limits(const SerdWorld* ZIX_NONNULL world); /** diff --git a/meson.build b/meson.build index df3f237f..366c8faf 100644 --- a/meson.build +++ b/meson.build @@ -155,10 +155,11 @@ sources = files( 'src/byte_source.c', 'src/caret.c', 'src/env.c', - 'src/n3.c', 'src/node.c', 'src/read_nquads.c', 'src/read_ntriples.c', + 'src/read_trig.c', + 'src/read_turtle.c', 'src/read_utf8.c', 'src/reader.c', 'src/sink.c', diff --git a/src/read_trig.c b/src/read_trig.c new file mode 100644 index 00000000..45ac39a0 --- /dev/null +++ b/src/read_trig.c @@ -0,0 +1,203 @@ +// Copyright 2011-2023 David Robillard <d@drobilla.net> +// SPDX-License-Identifier: ISC + +#include "read_trig.h" +#include "read_ntriples.h" +#include "read_turtle.h" +#include "reader.h" +#include "stack.h" +#include "try.h" + +#include "serd/node.h" +#include "serd/reader.h" +#include "serd/statement.h" +#include "serd/status.h" + +#include <stdbool.h> +#include <stdio.h> + +static SerdStatus +read_wrappedGraph(SerdReader* const reader, ReadContext* const ctx) +{ + SerdStatus st = SERD_SUCCESS; + TRY(st, eat_byte_check(reader, '{')); + read_turtle_ws_star(reader); + + while (peek_byte(reader) != '}') { + const size_t orig_stack_size = reader->stack.size; + bool ate_dot = false; + int s_type = 0; + + ctx->subject = 0; + if ((st = read_turtle_subject(reader, *ctx, &ctx->subject, &s_type))) { + return r_err(reader, st, "expected subject"); + } + + if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) && s_type != '[') { + return r_err(reader, st, "bad predicate object list"); + } + + serd_stack_pop_to(&reader->stack, orig_stack_size); + read_turtle_ws_star(reader); + if (peek_byte(reader) == '.') { + skip_byte(reader, '.'); + } + read_turtle_ws_star(reader); + } + + skip_byte(reader, '}'); + read_turtle_ws_star(reader); + if (peek_byte(reader) == '.') { + return r_err(reader, SERD_BAD_SYNTAX, "graph followed by '.'"); + } + + return SERD_SUCCESS; +} + +static SerdStatus +read_labelOrSubject(SerdReader* const reader, SerdNode** const dest) +{ + SerdStatus st = SERD_SUCCESS; + bool ate_dot = false; + + switch (peek_byte(reader)) { + case '[': + skip_byte(reader, '['); + read_turtle_ws_star(reader); + TRY(st, eat_byte_check(reader, ']')); + *dest = blank_id(reader); + return *dest ? SERD_SUCCESS : SERD_BAD_STACK; + case '_': + return read_BLANK_NODE_LABEL(reader, dest, &ate_dot); + default: + if (!read_turtle_iri(reader, dest, &ate_dot)) { + return SERD_SUCCESS; + } else { + return r_err(reader, SERD_BAD_SYNTAX, "expected label or subject"); + } + } +} + +static SerdStatus +read_sparql_directive(SerdReader* const reader, + ReadContext* const ctx, + const SerdNode* const token) +{ + if (!tokcmp(token, "base", 4)) { + return read_turtle_base(reader, true, false); + } + + if (!tokcmp(token, "prefix", 6)) { + return read_turtle_prefixID(reader, true, false); + } + + if (!tokcmp(token, "graph", 5)) { + SerdStatus st = SERD_SUCCESS; + read_turtle_ws_star(reader); + TRY(st, read_labelOrSubject(reader, &ctx->graph)); + read_turtle_ws_star(reader); + return read_wrappedGraph(reader, ctx); + } + + return SERD_FAILURE; +} + +static SerdStatus +read_block(SerdReader* const reader, ReadContext* const ctx) +{ + SerdStatus st = SERD_SUCCESS; + + // Try to read a subject, though it may actually be a directive or graph name + SerdNode* token = NULL; + int s_type = 0; + if ((st = read_turtle_subject(reader, *ctx, &token, &s_type)) > + SERD_FAILURE) { + return st; + } + + // Try to interpret as a SPARQL "PREFIX" or "BASE" directive + if (st && (st = read_sparql_directive(reader, ctx, token)) != SERD_FAILURE) { + return st; + } + + // Try to interpret as a named TriG graph like "graphname { ..." + read_turtle_ws_star(reader); + if (peek_byte(reader) == '{') { + if (s_type == '(' || (s_type == '[' && !*ctx->flags)) { + return r_err(reader, SERD_BAD_SYNTAX, "invalid graph name"); + } + + ctx->graph = token; + return read_wrappedGraph(reader, ctx); + } + + if (st) { + return r_err(reader, SERD_BAD_SYNTAX, "expected directive or subject"); + } + + // Our token is really a subject, read some triples + bool ate_dot = false; + ctx->subject = token; + if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) { + return st; + } + + // "Failure" is only allowed for anonymous subjects like "[ ... ] ." + if (st && s_type != '[') { + return r_err(reader, SERD_BAD_SYNTAX, "expected triples"); + } + + // Ensure that triples are properly terminated + return ate_dot ? st : eat_byte_check(reader, '.'); +} + +SerdStatus +read_trig_statement(SerdReader* const reader) +{ + SerdStatementFlags flags = 0; + ReadContext ctx = {0, 0, 0, 0, &flags}; + + // Handle nice cases we can distinguish from the next byte + read_turtle_ws_star(reader); + switch (peek_byte(reader)) { + case EOF: + return SERD_FAILURE; + + case '\0': + eat_byte(reader); + return SERD_FAILURE; + + case '@': + return read_turtle_directive(reader); + + case '{': + return read_wrappedGraph(reader, &ctx); + + default: + break; + } + + // No such luck, figure out what to read from the first token + return read_block(reader, &ctx); +} + +SerdStatus +read_trigDoc(SerdReader* const reader) +{ + while (!reader->source.eof) { + const size_t orig_stack_size = reader->stack.size; + const SerdStatus st = read_trig_statement(reader); + + if (st > SERD_FAILURE) { + if (!tolerate_status(reader, st)) { + serd_stack_pop_to(&reader->stack, orig_stack_size); + return st; + } + serd_reader_skip_until_byte(reader, '\n'); + } + + serd_stack_pop_to(&reader->stack, orig_stack_size); + } + + return SERD_SUCCESS; +} diff --git a/src/read_trig.h b/src/read_trig.h new file mode 100644 index 00000000..a73f39d1 --- /dev/null +++ b/src/read_trig.h @@ -0,0 +1,24 @@ +// Copyright 2011-2023 David Robillard <d@drobilla.net> +// SPDX-License-Identifier: ISC + +#ifndef SERD_SRC_READ_TRIG_H +#define SERD_SRC_READ_TRIG_H + +#include "serd/reader.h" +#include "serd/status.h" + +/** + Read a single TriG statement. +*/ +SerdStatus +read_trig_statement(SerdReader* reader); + +/** + Read a complete TriG document. + + RDF 1.1 Trig: [1] trigDoc +*/ +SerdStatus +read_trigDoc(SerdReader* reader); + +#endif // SERD_SRC_READ_TRIG_H diff --git a/src/n3.c b/src/read_turtle.c index b731feaf..ef76c858 100644 --- a/src/n3.c +++ b/src/read_turtle.c @@ -1,6 +1,7 @@ // Copyright 2011-2023 David Robillard <d@drobilla.net> // SPDX-License-Identifier: ISC +#include "read_turtle.h" #include "byte_source.h" #include "namespaces.h" #include "node.h" @@ -18,7 +19,6 @@ #include "serd/statement.h" #include "serd/status.h" #include "serd/string_view.h" -#include "serd/syntax.h" #include <assert.h> #include <stdbool.h> @@ -51,8 +51,8 @@ read_whitespace(SerdReader* const reader) return SERD_FAILURE; } -static bool -read_ws_star(SerdReader* const reader) +bool +read_turtle_ws_star(SerdReader* const reader) { while (!read_whitespace(reader)) { } @@ -63,7 +63,7 @@ read_ws_star(SerdReader* const reader) static bool peek_delim(SerdReader* const reader, const uint8_t delim) { - read_ws_star(reader); + read_turtle_ws_star(reader); return peek_byte(reader) == delim; } @@ -72,7 +72,7 @@ eat_delim(SerdReader* const reader, const uint8_t delim) { if (peek_delim(reader, delim)) { skip_byte(reader, delim); - return read_ws_star(reader); + return read_turtle_ws_star(reader); } return false; @@ -403,8 +403,10 @@ read_number(SerdReader* const reader, return meta ? SERD_SUCCESS : SERD_BAD_STACK; } -static SerdStatus -read_iri(SerdReader* const reader, SerdNode** const dest, bool* const ate_dot) +SerdStatus +read_turtle_iri(SerdReader* const reader, + SerdNode** const dest, + bool* const ate_dot) { switch (peek_byte(reader)) { case '<': @@ -441,7 +443,7 @@ read_literal(SerdReader* const reader, skip_byte(reader, '^'); TRY(st, eat_byte_check(reader, '^')); (*dest)->flags |= SERD_HAS_DATATYPE; - TRY(st, read_iri(reader, &datatype, ate_dot)); + TRY(st, read_turtle_iri(reader, &datatype, ate_dot)); break; } return SERD_SUCCESS; @@ -526,7 +528,7 @@ read_anon(SerdReader* const reader, return r_err(reader, SERD_BAD_SYNTAX, "'.' inside blank"); } - read_ws_star(reader); + read_turtle_ws_star(reader); *ctx.flags = old_flags; TRY(st, serd_sink_write_end(reader->sink, *dest)); @@ -624,7 +626,7 @@ read_object(SerdReader* const reader, st = read_IRIREF(reader, &o); break; case ':': - st = read_iri(reader, &o, ate_dot); + st = read_turtle_iri(reader, &o, ate_dot); break; case '+': case '-': @@ -682,7 +684,8 @@ read_predicateObjectList(SerdReader* const reader, const size_t orig_stack_size = reader->stack.size; SerdStatus st = SERD_SUCCESS; - while (!(st = read_verb(reader, &ctx.predicate)) && read_ws_star(reader) && + while (!(st = read_verb(reader, &ctx.predicate)) && + read_turtle_ws_star(reader) && !(st = read_objectList(reader, ctx, ate_dot))) { if (*ate_dot) { serd_stack_pop_to(&reader->stack, orig_stack_size); @@ -692,7 +695,7 @@ read_predicateObjectList(SerdReader* const reader, bool ate_semi = false; int c = 0; do { - read_ws_star(reader); + read_turtle_ws_star(reader); switch (c = peek_byte(reader)) { case EOF: serd_stack_pop_to(&reader->stack, orig_stack_size); @@ -795,11 +798,11 @@ read_collection(SerdReader* const reader, return end_collection(reader, st); } -static SerdStatus -read_subject(SerdReader* const reader, - ReadContext ctx, - SerdNode** const dest, - int* const s_type) +SerdStatus +read_turtle_subject(SerdReader* const reader, + ReadContext ctx, + SerdNode** const dest, + int* const s_type) { SerdStatus st = SERD_SUCCESS; bool ate_dot = false; @@ -814,7 +817,7 @@ read_subject(SerdReader* const reader, st = read_BLANK_NODE_LABEL(reader, dest, &ate_dot); break; default: - TRY(st, read_iri(reader, dest, &ate_dot)); + TRY(st, read_turtle_iri(reader, dest, &ate_dot)); } if (ate_dot) { @@ -824,36 +827,14 @@ read_subject(SerdReader* const reader, return st; } -static SerdStatus -read_labelOrSubject(SerdReader* const reader, SerdNode** const dest) -{ - SerdStatus st = SERD_SUCCESS; - bool ate_dot = false; - - switch (peek_byte(reader)) { - case '[': - skip_byte(reader, '['); - read_ws_star(reader); - TRY(st, eat_byte_check(reader, ']')); - *dest = blank_id(reader); - return *dest ? SERD_SUCCESS : SERD_BAD_STACK; - case '_': - return read_BLANK_NODE_LABEL(reader, dest, &ate_dot); - default: - if (!read_iri(reader, dest, &ate_dot)) { - return SERD_SUCCESS; - } else { - return r_err(reader, SERD_BAD_SYNTAX, "expected label or subject"); - } - } -} - -static SerdStatus -read_triples(SerdReader* const reader, ReadContext ctx, bool* const ate_dot) +SerdStatus +read_turtle_triples(SerdReader* const reader, + ReadContext ctx, + bool* const ate_dot) { SerdStatus st = SERD_FAILURE; if (ctx.subject) { - read_ws_star(reader); + read_turtle_ws_star(reader); switch (peek_byte(reader)) { case '.': *ate_dot = eat_byte_safe(reader, '.'); @@ -868,15 +849,15 @@ read_triples(SerdReader* const reader, ReadContext ctx, bool* const ate_dot) return st > SERD_FAILURE ? st : SERD_SUCCESS; } -static SerdStatus -read_base(SerdReader* const reader, const bool sparql, const bool token) +SerdStatus +read_turtle_base(SerdReader* const reader, const bool sparql, const bool token) { SerdStatus st = SERD_SUCCESS; if (token) { TRY(st, eat_string(reader, "base", 4)); } - read_ws_star(reader); + read_turtle_ws_star(reader); SerdNode* uri = NULL; TRY(st, read_IRIREF(reader, &uri)); @@ -888,7 +869,7 @@ read_base(SerdReader* const reader, const bool sparql, const bool token) serd_node_zero_pad(uri); TRY(st, serd_sink_write_base(reader->sink, uri)); - read_ws_star(reader); + read_turtle_ws_star(reader); if (!sparql) { return eat_byte_check(reader, '.'); } @@ -900,15 +881,17 @@ read_base(SerdReader* const reader, const bool sparql, const bool token) return SERD_SUCCESS; } -static SerdStatus -read_prefixID(SerdReader* const reader, const bool sparql, const bool token) +SerdStatus +read_turtle_prefixID(SerdReader* const reader, + const bool sparql, + const bool token) { SerdStatus st = SERD_SUCCESS; if (token) { TRY(st, eat_string(reader, "prefix", 6)); } - read_ws_star(reader); + read_turtle_ws_star(reader); SerdNode* name = push_node(reader, SERD_LITERAL, "", 0); if (!name) { return SERD_BAD_STACK; @@ -917,7 +900,7 @@ read_prefixID(SerdReader* const reader, const bool sparql, const bool token) TRY_FAILING(st, read_PN_PREFIX(reader, name)); TRY(st, eat_byte_check(reader, ':')); - read_ws_star(reader); + read_turtle_ws_star(reader); SerdNode* uri = NULL; TRY(st, read_IRIREF(reader, &uri)); @@ -931,68 +914,22 @@ read_prefixID(SerdReader* const reader, const bool sparql, const bool token) st = serd_sink_write_prefix(reader->sink, name, uri); if (!sparql) { - read_ws_star(reader); + read_turtle_ws_star(reader); st = eat_byte_check(reader, '.'); } return st; } -static SerdStatus -read_wrappedGraph(SerdReader* const reader, ReadContext* const ctx) -{ - SerdStatus st = SERD_SUCCESS; - TRY(st, eat_byte_check(reader, '{')); - read_ws_star(reader); - - while (peek_byte(reader) != '}') { - const size_t orig_stack_size = reader->stack.size; - bool ate_dot = false; - int s_type = 0; - - ctx->subject = 0; - if ((st = read_subject(reader, *ctx, &ctx->subject, &s_type))) { - return r_err(reader, st, "expected subject"); - } - - if ((st = read_triples(reader, *ctx, &ate_dot)) && s_type != '[') { - return r_err(reader, st, "bad predicate object list"); - } - - serd_stack_pop_to(&reader->stack, orig_stack_size); - read_ws_star(reader); - if (peek_byte(reader) == '.') { - skip_byte(reader, '.'); - } - read_ws_star(reader); - } - - skip_byte(reader, '}'); - read_ws_star(reader); - if (peek_byte(reader) == '.') { - return r_err(reader, SERD_BAD_SYNTAX, "graph followed by '.'"); - } - - return SERD_SUCCESS; -} - -static int -tokcmp(const SerdNode* const node, const char* const tok, const size_t n) -{ - return ((!node || node->length != n) - ? -1 - : serd_strncasecmp(serd_node_string(node), tok, n)); -} - -static SerdStatus +SerdStatus read_turtle_directive(SerdReader* const reader) { skip_byte(reader, '@'); switch (peek_byte(reader)) { case 'b': - return read_base(reader, false, true); + return read_turtle_base(reader, false, true); case 'p': - return read_prefixID(reader, false, true); + return read_turtle_prefixID(reader, false, true); default: break; } @@ -1001,24 +938,14 @@ read_turtle_directive(SerdReader* const reader) } static SerdStatus -read_sparql_directive(SerdReader* const reader, - ReadContext* const ctx, - const SerdNode* const token) +read_sparql_directive(SerdReader* const reader, const SerdNode* const token) { if (!tokcmp(token, "base", 4)) { - return read_base(reader, true, false); + return read_turtle_base(reader, true, false); } if (!tokcmp(token, "prefix", 6)) { - return read_prefixID(reader, true, false); - } - - if (!tokcmp(token, "graph", 5)) { - SerdStatus st = SERD_SUCCESS; - read_ws_star(reader); - TRY(st, read_labelOrSubject(reader, &ctx->graph)); - read_ws_star(reader); - return read_wrappedGraph(reader, ctx); + return read_turtle_prefixID(reader, true, false); } return SERD_FAILURE; @@ -1032,26 +959,16 @@ read_block(SerdReader* const reader, ReadContext* const ctx) // Try to read a subject, though it may actually be a directive or graph name SerdNode* token = NULL; int s_type = 0; - if ((st = read_subject(reader, *ctx, &token, &s_type)) > SERD_FAILURE) { + if ((st = read_turtle_subject(reader, *ctx, &token, &s_type)) > + SERD_FAILURE) { return st; } // Try to interpret as a SPARQL "PREFIX" or "BASE" directive - if (st && (st = read_sparql_directive(reader, ctx, token)) != SERD_FAILURE) { + if (st && (st = read_sparql_directive(reader, token)) != SERD_FAILURE) { return st; } - // Try to interpret as a named TriG graph like "graphname { ..." - read_ws_star(reader); - if (peek_byte(reader) == '{') { - if (s_type == '(' || (s_type == '[' && !*ctx->flags)) { - return r_err(reader, SERD_BAD_SYNTAX, "invalid graph name"); - } - - ctx->graph = token; - return read_wrappedGraph(reader, ctx); - } - if (st) { return r_err(reader, SERD_BAD_SYNTAX, "expected directive or subject"); } @@ -1059,7 +976,7 @@ read_block(SerdReader* const reader, ReadContext* const ctx) // Our token is really a subject, read some triples bool ate_dot = false; ctx->subject = token; - if ((st = read_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) { + if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) { return st; } @@ -1073,13 +990,13 @@ read_block(SerdReader* const reader, ReadContext* const ctx) } SerdStatus -read_n3_statement(SerdReader* const reader) +read_turtle_statement(SerdReader* const reader) { SerdStatementFlags flags = 0; ReadContext ctx = {0, 0, 0, 0, &flags}; // Handle nice cases we can distinguish from the next byte - read_ws_star(reader); + read_turtle_ws_star(reader); switch (peek_byte(reader)) { case EOF: return SERD_FAILURE; @@ -1091,11 +1008,6 @@ read_n3_statement(SerdReader* const reader) case '@': return read_turtle_directive(reader); - case '{': - return (reader->syntax == SERD_TRIG) - ? read_wrappedGraph(reader, &ctx) - : r_err(reader, SERD_BAD_SYNTAX, "syntax does not support graphs"); - default: break; } @@ -1105,11 +1017,11 @@ read_n3_statement(SerdReader* const reader) } SerdStatus -read_turtleTrigDoc(SerdReader* const reader) +read_turtleDoc(SerdReader* const reader) { while (!reader->source.eof) { const size_t orig_stack_size = reader->stack.size; - const SerdStatus st = read_n3_statement(reader); + const SerdStatus st = read_turtle_statement(reader); if (st > SERD_FAILURE) { if (!tolerate_status(reader, st)) { diff --git a/src/read_turtle.h b/src/read_turtle.h new file mode 100644 index 00000000..be3d961c --- /dev/null +++ b/src/read_turtle.h @@ -0,0 +1,89 @@ +// Copyright 2011-2021 David Robillard <d@drobilla.net> +// SPDX-License-Identifier: ISC + +#ifndef SERD_SRC_READ_TURTLE_H +#define SERD_SRC_READ_TURTLE_H + +#include "reader.h" + +#include "serd/node.h" +#include "serd/reader.h" +#include "serd/status.h" + +#include <stdbool.h> + +/** + Read (skip) any amount of whitespace. + + RDF 1.1 Turtle: [161s] WS (but here with a *) +*/ +bool +read_turtle_ws_star(SerdReader* reader); + +// Nonterminals + +/** + Read a Turtle prefix or base directive. + + RDF 1.1 Turtle: [4] prefixId and [5] base +*/ +SerdStatus +read_turtle_directive(SerdReader* reader); + +/** + Read a Turtle base directive. + + RDF 1.1 Turtle: [5] base +*/ +SerdStatus +read_turtle_base(SerdReader* reader, bool sparql, bool token); + +/** + Read a Turtle prefixID directive. + + RDF 1.1 Turtle: [4] prefixID +*/ +SerdStatus +read_turtle_prefixID(SerdReader* reader, bool sparql, bool token); + +/** + Read a Turtle IRI node. + + RDF 1.1 Turtle: [135s] iri +*/ +SerdStatus +read_turtle_iri(SerdReader* reader, SerdNode** dest, bool* ate_dot); + +/** + Read a Turtle subject node. + + RDF 1.1 Turtle: [10] subject +*/ +SerdStatus +read_turtle_subject(SerdReader* reader, + ReadContext ctx, + SerdNode** dest, + int* s_type); +/** + Read a single Turtle statement. +*/ +SerdStatus +read_turtle_statement(SerdReader* reader); + +/** + Read a series of Turtle triples. + + RDF 1.1 Turtle: [6] triples +*/ +SerdStatus +read_turtle_triples(SerdReader* reader, ReadContext ctx, bool* ate_dot); + +/** + Read a complete Turtle document. + + RDF 1.1 Turtle: [1] turtleDoc +*/ +SerdStatus +read_turtleDoc(SerdReader* reader); + +#endif // SERD_SRC_READ_TURTLE_H diff --git a/src/reader.c b/src/reader.c index 1c99b033..d7c87c47 100644 --- a/src/reader.c +++ b/src/reader.c @@ -8,8 +8,11 @@ #include "node.h" #include "read_nquads.h" #include "read_ntriples.h" +#include "read_trig.h" +#include "read_turtle.h" #include "stack.h" #include "statement.h" +#include "string_utils.h" #include "system.h" #include "world.h" @@ -149,6 +152,14 @@ push_node(SerdReader* const reader, return push_node_padded(reader, length, type, str, length); } +int +tokcmp(const SerdNode* const node, const char* const tok, const size_t n) +{ + return ((!node || node->length != n) + ? -1 + : serd_strncasecmp(serd_node_string(node), tok, n)); +} + SerdStatus emit_statement(SerdReader* const reader, const ReadContext ctx, @@ -188,13 +199,13 @@ serd_reader_read_document(SerdReader* const reader) case SERD_SYNTAX_EMPTY: break; case SERD_TURTLE: - return read_turtleTrigDoc(reader); + return read_turtleDoc(reader); case SERD_NTRIPLES: return read_ntriplesDoc(reader); case SERD_NQUADS: return read_nquadsDoc(reader); case SERD_TRIG: - return read_turtleTrigDoc(reader); + return read_trigDoc(reader); } return SERD_SUCCESS; @@ -367,9 +378,23 @@ serd_reader_read_chunk(SerdReader* const reader) return SERD_FAILURE; } - return st ? st - : (reader->syntax == SERD_NQUADS) ? read_nquads_line(reader) - : read_n3_statement(reader); + if (st) { + return st; + } + + switch (reader->syntax) { + case SERD_SYNTAX_EMPTY: + break; + case SERD_TURTLE: + case SERD_NTRIPLES: + return read_turtle_statement(reader); + case SERD_NQUADS: + return read_nquads_line(reader); + case SERD_TRIG: + return read_trig_statement(reader); + } + + return SERD_FAILURE; } SerdStatus diff --git a/src/reader.h b/src/reader.h index 0907d4cc..7bd4ff95 100644 --- a/src/reader.h +++ b/src/reader.h @@ -72,6 +72,9 @@ push_node(SerdReader* reader, const char* str, size_t length); +ZIX_PURE_FUNC int +tokcmp(const SerdNode* node, const char* tok, size_t n); + ZIX_PURE_FUNC size_t genid_length(const SerdReader* reader); @@ -87,12 +90,6 @@ set_blank_id(SerdReader* reader, SerdNode* node, size_t buf_size); SerdStatus emit_statement(SerdReader* reader, ReadContext ctx, SerdNode* o); -SerdStatus -read_n3_statement(SerdReader* reader); - -SerdStatus -read_turtleTrigDoc(SerdReader* reader); - static inline int peek_byte(SerdReader* reader) { diff --git a/test/test_syntax.c b/test/test_syntax.c index 19f4a463..c2de8526 100644 --- a/test/test_syntax.c +++ b/test/test_syntax.c @@ -4,6 +4,7 @@ #undef NDEBUG #include "serd/syntax.h" +#include "zix/attributes.h" #include <assert.h> @@ -49,7 +50,7 @@ test_syntax_has_graphs(void) assert(serd_syntax_has_graphs(SERD_TRIG)); } -int +ZIX_PURE_FUNC int main(void) { test_syntax_by_name(); |