aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorDavid Robillard <d@drobilla.net>2023-09-10 13:39:56 -0400
committerDavid Robillard <d@drobilla.net>2023-12-02 18:49:07 -0500
commitd80b2a1c153f81685d026f8e09c12175abed3d03 (patch)
tree8207788e58ee9de94ca224433a02a88e8fed3801
parent76fabe903adb09e6fe4d084ff6be49115285e086 (diff)
downloadserd-d80b2a1c153f81685d026f8e09c12175abed3d03.tar.gz
serd-d80b2a1c153f81685d026f8e09c12175abed3d03.tar.bz2
serd-d80b2a1c153f81685d026f8e09c12175abed3d03.zip
Separate Turtle and TriG reading code
-rw-r--r--include/serd/world.h2
-rw-r--r--meson.build3
-rw-r--r--src/read_trig.c203
-rw-r--r--src/read_trig.h24
-rw-r--r--src/read_turtle.c (renamed from src/n3.c)190
-rw-r--r--src/read_turtle.h89
-rw-r--r--src/reader.c35
-rw-r--r--src/reader.h9
-rw-r--r--test/test_syntax.c3
9 files changed, 405 insertions, 153 deletions
diff --git a/include/serd/world.h b/include/serd/world.h
index 4c51df73..86e43bb1 100644
--- a/include/serd/world.h
+++ b/include/serd/world.h
@@ -51,7 +51,7 @@ serd_world_free(SerdWorld* ZIX_NULLABLE world);
a megabyte and over 100 levels of nesting, which is more than enough for
most data.
*/
-SERD_API SerdLimits
+SERD_PURE_API SerdLimits
serd_world_limits(const SerdWorld* ZIX_NONNULL world);
/**
diff --git a/meson.build b/meson.build
index df3f237f..366c8faf 100644
--- a/meson.build
+++ b/meson.build
@@ -155,10 +155,11 @@ sources = files(
'src/byte_source.c',
'src/caret.c',
'src/env.c',
- 'src/n3.c',
'src/node.c',
'src/read_nquads.c',
'src/read_ntriples.c',
+ 'src/read_trig.c',
+ 'src/read_turtle.c',
'src/read_utf8.c',
'src/reader.c',
'src/sink.c',
diff --git a/src/read_trig.c b/src/read_trig.c
new file mode 100644
index 00000000..45ac39a0
--- /dev/null
+++ b/src/read_trig.c
@@ -0,0 +1,203 @@
+// Copyright 2011-2023 David Robillard <d@drobilla.net>
+// SPDX-License-Identifier: ISC
+
+#include "read_trig.h"
+#include "read_ntriples.h"
+#include "read_turtle.h"
+#include "reader.h"
+#include "stack.h"
+#include "try.h"
+
+#include "serd/node.h"
+#include "serd/reader.h"
+#include "serd/statement.h"
+#include "serd/status.h"
+
+#include <stdbool.h>
+#include <stdio.h>
+
+static SerdStatus
+read_wrappedGraph(SerdReader* const reader, ReadContext* const ctx)
+{
+ SerdStatus st = SERD_SUCCESS;
+ TRY(st, eat_byte_check(reader, '{'));
+ read_turtle_ws_star(reader);
+
+ while (peek_byte(reader) != '}') {
+ const size_t orig_stack_size = reader->stack.size;
+ bool ate_dot = false;
+ int s_type = 0;
+
+ ctx->subject = 0;
+ if ((st = read_turtle_subject(reader, *ctx, &ctx->subject, &s_type))) {
+ return r_err(reader, st, "expected subject");
+ }
+
+ if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) && s_type != '[') {
+ return r_err(reader, st, "bad predicate object list");
+ }
+
+ serd_stack_pop_to(&reader->stack, orig_stack_size);
+ read_turtle_ws_star(reader);
+ if (peek_byte(reader) == '.') {
+ skip_byte(reader, '.');
+ }
+ read_turtle_ws_star(reader);
+ }
+
+ skip_byte(reader, '}');
+ read_turtle_ws_star(reader);
+ if (peek_byte(reader) == '.') {
+ return r_err(reader, SERD_BAD_SYNTAX, "graph followed by '.'");
+ }
+
+ return SERD_SUCCESS;
+}
+
+static SerdStatus
+read_labelOrSubject(SerdReader* const reader, SerdNode** const dest)
+{
+ SerdStatus st = SERD_SUCCESS;
+ bool ate_dot = false;
+
+ switch (peek_byte(reader)) {
+ case '[':
+ skip_byte(reader, '[');
+ read_turtle_ws_star(reader);
+ TRY(st, eat_byte_check(reader, ']'));
+ *dest = blank_id(reader);
+ return *dest ? SERD_SUCCESS : SERD_BAD_STACK;
+ case '_':
+ return read_BLANK_NODE_LABEL(reader, dest, &ate_dot);
+ default:
+ if (!read_turtle_iri(reader, dest, &ate_dot)) {
+ return SERD_SUCCESS;
+ } else {
+ return r_err(reader, SERD_BAD_SYNTAX, "expected label or subject");
+ }
+ }
+}
+
+static SerdStatus
+read_sparql_directive(SerdReader* const reader,
+ ReadContext* const ctx,
+ const SerdNode* const token)
+{
+ if (!tokcmp(token, "base", 4)) {
+ return read_turtle_base(reader, true, false);
+ }
+
+ if (!tokcmp(token, "prefix", 6)) {
+ return read_turtle_prefixID(reader, true, false);
+ }
+
+ if (!tokcmp(token, "graph", 5)) {
+ SerdStatus st = SERD_SUCCESS;
+ read_turtle_ws_star(reader);
+ TRY(st, read_labelOrSubject(reader, &ctx->graph));
+ read_turtle_ws_star(reader);
+ return read_wrappedGraph(reader, ctx);
+ }
+
+ return SERD_FAILURE;
+}
+
+static SerdStatus
+read_block(SerdReader* const reader, ReadContext* const ctx)
+{
+ SerdStatus st = SERD_SUCCESS;
+
+ // Try to read a subject, though it may actually be a directive or graph name
+ SerdNode* token = NULL;
+ int s_type = 0;
+ if ((st = read_turtle_subject(reader, *ctx, &token, &s_type)) >
+ SERD_FAILURE) {
+ return st;
+ }
+
+ // Try to interpret as a SPARQL "PREFIX" or "BASE" directive
+ if (st && (st = read_sparql_directive(reader, ctx, token)) != SERD_FAILURE) {
+ return st;
+ }
+
+ // Try to interpret as a named TriG graph like "graphname { ..."
+ read_turtle_ws_star(reader);
+ if (peek_byte(reader) == '{') {
+ if (s_type == '(' || (s_type == '[' && !*ctx->flags)) {
+ return r_err(reader, SERD_BAD_SYNTAX, "invalid graph name");
+ }
+
+ ctx->graph = token;
+ return read_wrappedGraph(reader, ctx);
+ }
+
+ if (st) {
+ return r_err(reader, SERD_BAD_SYNTAX, "expected directive or subject");
+ }
+
+ // Our token is really a subject, read some triples
+ bool ate_dot = false;
+ ctx->subject = token;
+ if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) {
+ return st;
+ }
+
+ // "Failure" is only allowed for anonymous subjects like "[ ... ] ."
+ if (st && s_type != '[') {
+ return r_err(reader, SERD_BAD_SYNTAX, "expected triples");
+ }
+
+ // Ensure that triples are properly terminated
+ return ate_dot ? st : eat_byte_check(reader, '.');
+}
+
+SerdStatus
+read_trig_statement(SerdReader* const reader)
+{
+ SerdStatementFlags flags = 0;
+ ReadContext ctx = {0, 0, 0, 0, &flags};
+
+ // Handle nice cases we can distinguish from the next byte
+ read_turtle_ws_star(reader);
+ switch (peek_byte(reader)) {
+ case EOF:
+ return SERD_FAILURE;
+
+ case '\0':
+ eat_byte(reader);
+ return SERD_FAILURE;
+
+ case '@':
+ return read_turtle_directive(reader);
+
+ case '{':
+ return read_wrappedGraph(reader, &ctx);
+
+ default:
+ break;
+ }
+
+ // No such luck, figure out what to read from the first token
+ return read_block(reader, &ctx);
+}
+
+SerdStatus
+read_trigDoc(SerdReader* const reader)
+{
+ while (!reader->source.eof) {
+ const size_t orig_stack_size = reader->stack.size;
+ const SerdStatus st = read_trig_statement(reader);
+
+ if (st > SERD_FAILURE) {
+ if (!tolerate_status(reader, st)) {
+ serd_stack_pop_to(&reader->stack, orig_stack_size);
+ return st;
+ }
+ serd_reader_skip_until_byte(reader, '\n');
+ }
+
+ serd_stack_pop_to(&reader->stack, orig_stack_size);
+ }
+
+ return SERD_SUCCESS;
+}
diff --git a/src/read_trig.h b/src/read_trig.h
new file mode 100644
index 00000000..a73f39d1
--- /dev/null
+++ b/src/read_trig.h
@@ -0,0 +1,24 @@
+// Copyright 2011-2023 David Robillard <d@drobilla.net>
+// SPDX-License-Identifier: ISC
+
+#ifndef SERD_SRC_READ_TRIG_H
+#define SERD_SRC_READ_TRIG_H
+
+#include "serd/reader.h"
+#include "serd/status.h"
+
+/**
+ Read a single TriG statement.
+*/
+SerdStatus
+read_trig_statement(SerdReader* reader);
+
+/**
+ Read a complete TriG document.
+
+ RDF 1.1 Trig: [1] trigDoc
+*/
+SerdStatus
+read_trigDoc(SerdReader* reader);
+
+#endif // SERD_SRC_READ_TRIG_H
diff --git a/src/n3.c b/src/read_turtle.c
index b731feaf..ef76c858 100644
--- a/src/n3.c
+++ b/src/read_turtle.c
@@ -1,6 +1,7 @@
// Copyright 2011-2023 David Robillard <d@drobilla.net>
// SPDX-License-Identifier: ISC
+#include "read_turtle.h"
#include "byte_source.h"
#include "namespaces.h"
#include "node.h"
@@ -18,7 +19,6 @@
#include "serd/statement.h"
#include "serd/status.h"
#include "serd/string_view.h"
-#include "serd/syntax.h"
#include <assert.h>
#include <stdbool.h>
@@ -51,8 +51,8 @@ read_whitespace(SerdReader* const reader)
return SERD_FAILURE;
}
-static bool
-read_ws_star(SerdReader* const reader)
+bool
+read_turtle_ws_star(SerdReader* const reader)
{
while (!read_whitespace(reader)) {
}
@@ -63,7 +63,7 @@ read_ws_star(SerdReader* const reader)
static bool
peek_delim(SerdReader* const reader, const uint8_t delim)
{
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
return peek_byte(reader) == delim;
}
@@ -72,7 +72,7 @@ eat_delim(SerdReader* const reader, const uint8_t delim)
{
if (peek_delim(reader, delim)) {
skip_byte(reader, delim);
- return read_ws_star(reader);
+ return read_turtle_ws_star(reader);
}
return false;
@@ -403,8 +403,10 @@ read_number(SerdReader* const reader,
return meta ? SERD_SUCCESS : SERD_BAD_STACK;
}
-static SerdStatus
-read_iri(SerdReader* const reader, SerdNode** const dest, bool* const ate_dot)
+SerdStatus
+read_turtle_iri(SerdReader* const reader,
+ SerdNode** const dest,
+ bool* const ate_dot)
{
switch (peek_byte(reader)) {
case '<':
@@ -441,7 +443,7 @@ read_literal(SerdReader* const reader,
skip_byte(reader, '^');
TRY(st, eat_byte_check(reader, '^'));
(*dest)->flags |= SERD_HAS_DATATYPE;
- TRY(st, read_iri(reader, &datatype, ate_dot));
+ TRY(st, read_turtle_iri(reader, &datatype, ate_dot));
break;
}
return SERD_SUCCESS;
@@ -526,7 +528,7 @@ read_anon(SerdReader* const reader,
return r_err(reader, SERD_BAD_SYNTAX, "'.' inside blank");
}
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
*ctx.flags = old_flags;
TRY(st, serd_sink_write_end(reader->sink, *dest));
@@ -624,7 +626,7 @@ read_object(SerdReader* const reader,
st = read_IRIREF(reader, &o);
break;
case ':':
- st = read_iri(reader, &o, ate_dot);
+ st = read_turtle_iri(reader, &o, ate_dot);
break;
case '+':
case '-':
@@ -682,7 +684,8 @@ read_predicateObjectList(SerdReader* const reader,
const size_t orig_stack_size = reader->stack.size;
SerdStatus st = SERD_SUCCESS;
- while (!(st = read_verb(reader, &ctx.predicate)) && read_ws_star(reader) &&
+ while (!(st = read_verb(reader, &ctx.predicate)) &&
+ read_turtle_ws_star(reader) &&
!(st = read_objectList(reader, ctx, ate_dot))) {
if (*ate_dot) {
serd_stack_pop_to(&reader->stack, orig_stack_size);
@@ -692,7 +695,7 @@ read_predicateObjectList(SerdReader* const reader,
bool ate_semi = false;
int c = 0;
do {
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
switch (c = peek_byte(reader)) {
case EOF:
serd_stack_pop_to(&reader->stack, orig_stack_size);
@@ -795,11 +798,11 @@ read_collection(SerdReader* const reader,
return end_collection(reader, st);
}
-static SerdStatus
-read_subject(SerdReader* const reader,
- ReadContext ctx,
- SerdNode** const dest,
- int* const s_type)
+SerdStatus
+read_turtle_subject(SerdReader* const reader,
+ ReadContext ctx,
+ SerdNode** const dest,
+ int* const s_type)
{
SerdStatus st = SERD_SUCCESS;
bool ate_dot = false;
@@ -814,7 +817,7 @@ read_subject(SerdReader* const reader,
st = read_BLANK_NODE_LABEL(reader, dest, &ate_dot);
break;
default:
- TRY(st, read_iri(reader, dest, &ate_dot));
+ TRY(st, read_turtle_iri(reader, dest, &ate_dot));
}
if (ate_dot) {
@@ -824,36 +827,14 @@ read_subject(SerdReader* const reader,
return st;
}
-static SerdStatus
-read_labelOrSubject(SerdReader* const reader, SerdNode** const dest)
-{
- SerdStatus st = SERD_SUCCESS;
- bool ate_dot = false;
-
- switch (peek_byte(reader)) {
- case '[':
- skip_byte(reader, '[');
- read_ws_star(reader);
- TRY(st, eat_byte_check(reader, ']'));
- *dest = blank_id(reader);
- return *dest ? SERD_SUCCESS : SERD_BAD_STACK;
- case '_':
- return read_BLANK_NODE_LABEL(reader, dest, &ate_dot);
- default:
- if (!read_iri(reader, dest, &ate_dot)) {
- return SERD_SUCCESS;
- } else {
- return r_err(reader, SERD_BAD_SYNTAX, "expected label or subject");
- }
- }
-}
-
-static SerdStatus
-read_triples(SerdReader* const reader, ReadContext ctx, bool* const ate_dot)
+SerdStatus
+read_turtle_triples(SerdReader* const reader,
+ ReadContext ctx,
+ bool* const ate_dot)
{
SerdStatus st = SERD_FAILURE;
if (ctx.subject) {
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
switch (peek_byte(reader)) {
case '.':
*ate_dot = eat_byte_safe(reader, '.');
@@ -868,15 +849,15 @@ read_triples(SerdReader* const reader, ReadContext ctx, bool* const ate_dot)
return st > SERD_FAILURE ? st : SERD_SUCCESS;
}
-static SerdStatus
-read_base(SerdReader* const reader, const bool sparql, const bool token)
+SerdStatus
+read_turtle_base(SerdReader* const reader, const bool sparql, const bool token)
{
SerdStatus st = SERD_SUCCESS;
if (token) {
TRY(st, eat_string(reader, "base", 4));
}
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
SerdNode* uri = NULL;
TRY(st, read_IRIREF(reader, &uri));
@@ -888,7 +869,7 @@ read_base(SerdReader* const reader, const bool sparql, const bool token)
serd_node_zero_pad(uri);
TRY(st, serd_sink_write_base(reader->sink, uri));
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
if (!sparql) {
return eat_byte_check(reader, '.');
}
@@ -900,15 +881,17 @@ read_base(SerdReader* const reader, const bool sparql, const bool token)
return SERD_SUCCESS;
}
-static SerdStatus
-read_prefixID(SerdReader* const reader, const bool sparql, const bool token)
+SerdStatus
+read_turtle_prefixID(SerdReader* const reader,
+ const bool sparql,
+ const bool token)
{
SerdStatus st = SERD_SUCCESS;
if (token) {
TRY(st, eat_string(reader, "prefix", 6));
}
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
SerdNode* name = push_node(reader, SERD_LITERAL, "", 0);
if (!name) {
return SERD_BAD_STACK;
@@ -917,7 +900,7 @@ read_prefixID(SerdReader* const reader, const bool sparql, const bool token)
TRY_FAILING(st, read_PN_PREFIX(reader, name));
TRY(st, eat_byte_check(reader, ':'));
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
SerdNode* uri = NULL;
TRY(st, read_IRIREF(reader, &uri));
@@ -931,68 +914,22 @@ read_prefixID(SerdReader* const reader, const bool sparql, const bool token)
st = serd_sink_write_prefix(reader->sink, name, uri);
if (!sparql) {
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
st = eat_byte_check(reader, '.');
}
return st;
}
-static SerdStatus
-read_wrappedGraph(SerdReader* const reader, ReadContext* const ctx)
-{
- SerdStatus st = SERD_SUCCESS;
- TRY(st, eat_byte_check(reader, '{'));
- read_ws_star(reader);
-
- while (peek_byte(reader) != '}') {
- const size_t orig_stack_size = reader->stack.size;
- bool ate_dot = false;
- int s_type = 0;
-
- ctx->subject = 0;
- if ((st = read_subject(reader, *ctx, &ctx->subject, &s_type))) {
- return r_err(reader, st, "expected subject");
- }
-
- if ((st = read_triples(reader, *ctx, &ate_dot)) && s_type != '[') {
- return r_err(reader, st, "bad predicate object list");
- }
-
- serd_stack_pop_to(&reader->stack, orig_stack_size);
- read_ws_star(reader);
- if (peek_byte(reader) == '.') {
- skip_byte(reader, '.');
- }
- read_ws_star(reader);
- }
-
- skip_byte(reader, '}');
- read_ws_star(reader);
- if (peek_byte(reader) == '.') {
- return r_err(reader, SERD_BAD_SYNTAX, "graph followed by '.'");
- }
-
- return SERD_SUCCESS;
-}
-
-static int
-tokcmp(const SerdNode* const node, const char* const tok, const size_t n)
-{
- return ((!node || node->length != n)
- ? -1
- : serd_strncasecmp(serd_node_string(node), tok, n));
-}
-
-static SerdStatus
+SerdStatus
read_turtle_directive(SerdReader* const reader)
{
skip_byte(reader, '@');
switch (peek_byte(reader)) {
case 'b':
- return read_base(reader, false, true);
+ return read_turtle_base(reader, false, true);
case 'p':
- return read_prefixID(reader, false, true);
+ return read_turtle_prefixID(reader, false, true);
default:
break;
}
@@ -1001,24 +938,14 @@ read_turtle_directive(SerdReader* const reader)
}
static SerdStatus
-read_sparql_directive(SerdReader* const reader,
- ReadContext* const ctx,
- const SerdNode* const token)
+read_sparql_directive(SerdReader* const reader, const SerdNode* const token)
{
if (!tokcmp(token, "base", 4)) {
- return read_base(reader, true, false);
+ return read_turtle_base(reader, true, false);
}
if (!tokcmp(token, "prefix", 6)) {
- return read_prefixID(reader, true, false);
- }
-
- if (!tokcmp(token, "graph", 5)) {
- SerdStatus st = SERD_SUCCESS;
- read_ws_star(reader);
- TRY(st, read_labelOrSubject(reader, &ctx->graph));
- read_ws_star(reader);
- return read_wrappedGraph(reader, ctx);
+ return read_turtle_prefixID(reader, true, false);
}
return SERD_FAILURE;
@@ -1032,26 +959,16 @@ read_block(SerdReader* const reader, ReadContext* const ctx)
// Try to read a subject, though it may actually be a directive or graph name
SerdNode* token = NULL;
int s_type = 0;
- if ((st = read_subject(reader, *ctx, &token, &s_type)) > SERD_FAILURE) {
+ if ((st = read_turtle_subject(reader, *ctx, &token, &s_type)) >
+ SERD_FAILURE) {
return st;
}
// Try to interpret as a SPARQL "PREFIX" or "BASE" directive
- if (st && (st = read_sparql_directive(reader, ctx, token)) != SERD_FAILURE) {
+ if (st && (st = read_sparql_directive(reader, token)) != SERD_FAILURE) {
return st;
}
- // Try to interpret as a named TriG graph like "graphname { ..."
- read_ws_star(reader);
- if (peek_byte(reader) == '{') {
- if (s_type == '(' || (s_type == '[' && !*ctx->flags)) {
- return r_err(reader, SERD_BAD_SYNTAX, "invalid graph name");
- }
-
- ctx->graph = token;
- return read_wrappedGraph(reader, ctx);
- }
-
if (st) {
return r_err(reader, SERD_BAD_SYNTAX, "expected directive or subject");
}
@@ -1059,7 +976,7 @@ read_block(SerdReader* const reader, ReadContext* const ctx)
// Our token is really a subject, read some triples
bool ate_dot = false;
ctx->subject = token;
- if ((st = read_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) {
+ if ((st = read_turtle_triples(reader, *ctx, &ate_dot)) > SERD_FAILURE) {
return st;
}
@@ -1073,13 +990,13 @@ read_block(SerdReader* const reader, ReadContext* const ctx)
}
SerdStatus
-read_n3_statement(SerdReader* const reader)
+read_turtle_statement(SerdReader* const reader)
{
SerdStatementFlags flags = 0;
ReadContext ctx = {0, 0, 0, 0, &flags};
// Handle nice cases we can distinguish from the next byte
- read_ws_star(reader);
+ read_turtle_ws_star(reader);
switch (peek_byte(reader)) {
case EOF:
return SERD_FAILURE;
@@ -1091,11 +1008,6 @@ read_n3_statement(SerdReader* const reader)
case '@':
return read_turtle_directive(reader);
- case '{':
- return (reader->syntax == SERD_TRIG)
- ? read_wrappedGraph(reader, &ctx)
- : r_err(reader, SERD_BAD_SYNTAX, "syntax does not support graphs");
-
default:
break;
}
@@ -1105,11 +1017,11 @@ read_n3_statement(SerdReader* const reader)
}
SerdStatus
-read_turtleTrigDoc(SerdReader* const reader)
+read_turtleDoc(SerdReader* const reader)
{
while (!reader->source.eof) {
const size_t orig_stack_size = reader->stack.size;
- const SerdStatus st = read_n3_statement(reader);
+ const SerdStatus st = read_turtle_statement(reader);
if (st > SERD_FAILURE) {
if (!tolerate_status(reader, st)) {
diff --git a/src/read_turtle.h b/src/read_turtle.h
new file mode 100644
index 00000000..be3d961c
--- /dev/null
+++ b/src/read_turtle.h
@@ -0,0 +1,89 @@
+// Copyright 2011-2021 David Robillard <d@drobilla.net>
+// SPDX-License-Identifier: ISC
+
+#ifndef SERD_SRC_READ_TURTLE_H
+#define SERD_SRC_READ_TURTLE_H
+
+#include "reader.h"
+
+#include "serd/node.h"
+#include "serd/reader.h"
+#include "serd/status.h"
+
+#include <stdbool.h>
+
+/**
+ Read (skip) any amount of whitespace.
+
+ RDF 1.1 Turtle: [161s] WS (but here with a *)
+*/
+bool
+read_turtle_ws_star(SerdReader* reader);
+
+// Nonterminals
+
+/**
+ Read a Turtle prefix or base directive.
+
+ RDF 1.1 Turtle: [4] prefixId and [5] base
+*/
+SerdStatus
+read_turtle_directive(SerdReader* reader);
+
+/**
+ Read a Turtle base directive.
+
+ RDF 1.1 Turtle: [5] base
+*/
+SerdStatus
+read_turtle_base(SerdReader* reader, bool sparql, bool token);
+
+/**
+ Read a Turtle prefixID directive.
+
+ RDF 1.1 Turtle: [4] prefixID
+*/
+SerdStatus
+read_turtle_prefixID(SerdReader* reader, bool sparql, bool token);
+
+/**
+ Read a Turtle IRI node.
+
+ RDF 1.1 Turtle: [135s] iri
+*/
+SerdStatus
+read_turtle_iri(SerdReader* reader, SerdNode** dest, bool* ate_dot);
+
+/**
+ Read a Turtle subject node.
+
+ RDF 1.1 Turtle: [10] subject
+*/
+SerdStatus
+read_turtle_subject(SerdReader* reader,
+ ReadContext ctx,
+ SerdNode** dest,
+ int* s_type);
+/**
+ Read a single Turtle statement.
+*/
+SerdStatus
+read_turtle_statement(SerdReader* reader);
+
+/**
+ Read a series of Turtle triples.
+
+ RDF 1.1 Turtle: [6] triples
+*/
+SerdStatus
+read_turtle_triples(SerdReader* reader, ReadContext ctx, bool* ate_dot);
+
+/**
+ Read a complete Turtle document.
+
+ RDF 1.1 Turtle: [1] turtleDoc
+*/
+SerdStatus
+read_turtleDoc(SerdReader* reader);
+
+#endif // SERD_SRC_READ_TURTLE_H
diff --git a/src/reader.c b/src/reader.c
index 1c99b033..d7c87c47 100644
--- a/src/reader.c
+++ b/src/reader.c
@@ -8,8 +8,11 @@
#include "node.h"
#include "read_nquads.h"
#include "read_ntriples.h"
+#include "read_trig.h"
+#include "read_turtle.h"
#include "stack.h"
#include "statement.h"
+#include "string_utils.h"
#include "system.h"
#include "world.h"
@@ -149,6 +152,14 @@ push_node(SerdReader* const reader,
return push_node_padded(reader, length, type, str, length);
}
+int
+tokcmp(const SerdNode* const node, const char* const tok, const size_t n)
+{
+ return ((!node || node->length != n)
+ ? -1
+ : serd_strncasecmp(serd_node_string(node), tok, n));
+}
+
SerdStatus
emit_statement(SerdReader* const reader,
const ReadContext ctx,
@@ -188,13 +199,13 @@ serd_reader_read_document(SerdReader* const reader)
case SERD_SYNTAX_EMPTY:
break;
case SERD_TURTLE:
- return read_turtleTrigDoc(reader);
+ return read_turtleDoc(reader);
case SERD_NTRIPLES:
return read_ntriplesDoc(reader);
case SERD_NQUADS:
return read_nquadsDoc(reader);
case SERD_TRIG:
- return read_turtleTrigDoc(reader);
+ return read_trigDoc(reader);
}
return SERD_SUCCESS;
@@ -367,9 +378,23 @@ serd_reader_read_chunk(SerdReader* const reader)
return SERD_FAILURE;
}
- return st ? st
- : (reader->syntax == SERD_NQUADS) ? read_nquads_line(reader)
- : read_n3_statement(reader);
+ if (st) {
+ return st;
+ }
+
+ switch (reader->syntax) {
+ case SERD_SYNTAX_EMPTY:
+ break;
+ case SERD_TURTLE:
+ case SERD_NTRIPLES:
+ return read_turtle_statement(reader);
+ case SERD_NQUADS:
+ return read_nquads_line(reader);
+ case SERD_TRIG:
+ return read_trig_statement(reader);
+ }
+
+ return SERD_FAILURE;
}
SerdStatus
diff --git a/src/reader.h b/src/reader.h
index 0907d4cc..7bd4ff95 100644
--- a/src/reader.h
+++ b/src/reader.h
@@ -72,6 +72,9 @@ push_node(SerdReader* reader,
const char* str,
size_t length);
+ZIX_PURE_FUNC int
+tokcmp(const SerdNode* node, const char* tok, size_t n);
+
ZIX_PURE_FUNC size_t
genid_length(const SerdReader* reader);
@@ -87,12 +90,6 @@ set_blank_id(SerdReader* reader, SerdNode* node, size_t buf_size);
SerdStatus
emit_statement(SerdReader* reader, ReadContext ctx, SerdNode* o);
-SerdStatus
-read_n3_statement(SerdReader* reader);
-
-SerdStatus
-read_turtleTrigDoc(SerdReader* reader);
-
static inline int
peek_byte(SerdReader* reader)
{
diff --git a/test/test_syntax.c b/test/test_syntax.c
index 19f4a463..c2de8526 100644
--- a/test/test_syntax.c
+++ b/test/test_syntax.c
@@ -4,6 +4,7 @@
#undef NDEBUG
#include "serd/syntax.h"
+#include "zix/attributes.h"
#include <assert.h>
@@ -49,7 +50,7 @@ test_syntax_has_graphs(void)
assert(serd_syntax_has_graphs(SERD_TRIG));
}
-int
+ZIX_PURE_FUNC int
main(void)
{
test_syntax_by_name();