aboutsummaryrefslogtreecommitdiffstats
path: root/src/writer.c
diff options
context:
space:
mode:
authorDavid Robillard <d@drobilla.net>2011-01-21 01:52:11 +0000
committerDavid Robillard <d@drobilla.net>2011-01-21 01:52:11 +0000
commitc5a3f407cb46797f8b122d2f3843d382760a2c3b (patch)
tree106ad1d47987347308cc0db7deb8eaaf00ecde40 /src/writer.c
parent235eef1849b96bad3697f44c022f7a4e986299ff (diff)
downloadserd-c5a3f407cb46797f8b122d2f3843d382760a2c3b.tar.gz
serd-c5a3f407cb46797f8b122d2f3843d382760a2c3b.tar.bz2
serd-c5a3f407cb46797f8b122d2f3843d382760a2c3b.zip
Rename write.c to writer.c for consistency.
git-svn-id: http://svn.drobilla.net/serd/trunk@21 490d8e77-9747-427b-9fa3-0b8f29cee8a0
Diffstat (limited to 'src/writer.c')
-rw-r--r--src/writer.c223
1 files changed, 223 insertions, 0 deletions
diff --git a/src/writer.c b/src/writer.c
new file mode 100644
index 00000000..ef10594b
--- /dev/null
+++ b/src/writer.c
@@ -0,0 +1,223 @@
+/* Serd, an RDF serialisation library.
+ * Copyright 2011 David Robillard <d@drobilla.net>
+ *
+ * Serd is free software: you can redistribute it and/or modify it under
+ * the terms of the GNU Lesser General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Serd is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
+ * License for details.
+ *
+ * You should have received a copy of the GNU Lesser General Public License
+ * along with this program. If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include <assert.h>
+#include <stdio.h>
+#include <stdlib.h>
+
+#include "serd/serd.h"
+
+struct SerdWriterImpl {
+ SerdSyntax syntax;
+ SerdNamespaces ns;
+ SerdURI base_uri;
+ SerdSink sink;
+ void* stream;
+};
+
+static bool
+serd_write_ascii(SerdWriter writer, const uint8_t* utf8, size_t n_bytes, const uint8_t esc)
+{
+ char escape[10] = { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
+ for (size_t i = 0; i < n_bytes;) {
+ uint8_t in = utf8[i++];
+ switch (in) {
+ case '\\': writer->sink("\\\\", 2, writer->stream); continue;
+ case '\n': writer->sink("\\n", 2, writer->stream); continue;
+ case '\r': writer->sink("\\r", 2, writer->stream); continue;
+ case '\t': writer->sink("\\t", 2, writer->stream); continue;
+ case '"': if (esc == '"') { writer->sink("\\\"", 2, writer->stream); continue; }
+ default: break;
+ }
+
+ if (in == esc) {
+ sprintf(escape, "\\u%04X", esc);
+ writer->sink(escape, 6, writer->stream);
+ continue;
+ }
+
+ uint32_t c = 0;
+ size_t size = 0;
+ if ((in & 0x80) == 0) { // Starts with `0'
+ size = 1;
+ c = in & 0x7F;
+ if ((in >= 0x20) && (in <= 0x7E)) { // Printable ASCII
+ writer->sink(&in, 1, writer->stream);
+ continue;
+ }
+ } else if ((in & 0xE0) == 0xC0) { // Starts with `110'
+ size = 2;
+ c = in & 0x1F;
+ } else if ((in & 0xF0) == 0xE0) { // Starts with `1110'
+ size = 3;
+ c = in & 0x0F;
+ } else if ((in & 0xF8) == 0xF0) { // Starts with `11110'
+ size = 4;
+ c = in & 0x07;
+ } else if ((in & 0xFC) == 0xF8) { // Starts with `111110'
+ size = 5;
+ c = in & 0x03;
+ } else if ((in & 0xFE) == 0xFC) { // Starts with `1111110'
+ size = 6;
+ c = in & 0x01;
+ } else {
+ fprintf(stderr, "invalid UTF-8 at offset %zu: %X\n", i, in);
+ return false;
+ }
+
+#define READ_BYTE() do { \
+ assert(i < n_bytes); \
+ in = utf8[i++] & 0x3f; \
+ c <<= 6; \
+ c |= in; \
+ } while (0)
+
+ switch (size) {
+ case 6: READ_BYTE();
+ case 5: READ_BYTE();
+ case 4: READ_BYTE();
+ case 3: READ_BYTE();
+ case 2: READ_BYTE();
+ }
+
+ if (c < 0xFFFF) {
+ sprintf(escape, "\\u%04X", c);
+ writer->sink(escape, 6, writer->stream);
+ } else {
+ sprintf(escape, "\\U%08X", c);
+ writer->sink(escape, 10, writer->stream);
+ }
+ }
+ return true;
+}
+
+static bool
+serd_write_node(SerdWriter writer,
+ SerdNodeType type,
+ const SerdString* str,
+ const SerdString* datatype,
+ const SerdString* lang)
+{
+ const SerdURI* base_uri = &writer->base_uri;
+ SerdNamespaces ns = writer->ns;
+
+ SerdChunk uri_prefix;
+ SerdChunk uri_suffix;
+ switch (type) {
+ case BLANK:
+ writer->sink("_:", 2, writer->stream);
+ writer->sink(str->buf, str->n_bytes - 1, writer->stream);
+ break;
+ case QNAME:
+ if (!serd_namespaces_expand(ns, str, &uri_prefix, &uri_suffix)) {
+ fprintf(stderr, "error: undefined namespace prefix `%s'\n", str->buf);
+ return false;
+ }
+ writer->sink("<", 1, writer->stream);
+ serd_write_ascii(writer, uri_prefix.buf, uri_prefix.len, '>');
+ serd_write_ascii(writer, uri_suffix.buf, uri_suffix.len, '>');
+ writer->sink(">", 1, writer->stream);
+ break;
+ case URI:
+ if (!serd_uri_string_has_scheme(str->buf)) {
+ SerdURI uri;
+ if (serd_uri_parse(str->buf, &uri)) {
+ SerdURI abs_uri;
+ if (serd_uri_resolve(&uri, base_uri, &abs_uri)) {
+ writer->sink("<", 1, writer->stream);
+ serd_uri_serialise(&abs_uri, writer->sink, writer->stream);
+ writer->sink(">", 1, writer->stream);
+ return true;
+ }
+ }
+ } else {
+ writer->sink("<", 1, writer->stream);
+ serd_write_ascii(writer, str->buf, str->n_bytes - 1, '>');
+ writer->sink(">", 1, writer->stream);
+ return true;
+ }
+ return false;
+ case LITERAL:
+ writer->sink("\"", 1, writer->stream);
+ serd_write_ascii(writer, str->buf, str->n_bytes - 1, '"');
+ writer->sink("\"", 1, writer->stream);
+ if (lang) {
+ writer->sink("@", 1, writer->stream);
+ writer->sink(lang->buf, lang->n_bytes - 1, writer->stream);
+ } else if (datatype) {
+ writer->sink("^^", 2, writer->stream);
+ serd_write_node(writer, URI, datatype, NULL, NULL);
+ }
+ break;
+ }
+ return true;
+}
+
+SERD_API
+bool
+serd_writer_write_statement(SerdWriter writer,
+ const SerdString* graph,
+ const SerdString* subject,
+ SerdNodeType subject_type,
+ const SerdString* predicate,
+ SerdNodeType predicate_type,
+ const SerdString* object,
+ SerdNodeType object_type,
+ const SerdString* object_datatype,
+ const SerdString* object_lang)
+{
+ serd_write_node(writer, subject_type, subject, NULL, NULL);
+ writer->sink(" ", 1, writer->stream);
+ serd_write_node(writer, predicate_type, predicate, NULL, NULL);
+ writer->sink(" ", 1, writer->stream);
+ serd_write_node(writer, object_type, object, object_datatype, object_lang);
+ writer->sink(" .\n", 3, writer->stream);
+ return true;
+}
+
+SERD_API
+SerdWriter
+serd_writer_new(SerdSyntax syntax,
+ SerdNamespaces ns,
+ const SerdURI* base_uri,
+ SerdSink sink,
+ void* stream)
+{
+ SerdWriter writer = malloc(sizeof(struct SerdWriterImpl));
+ writer->syntax = syntax;
+ writer->ns = ns;
+ writer->base_uri = *base_uri;
+ writer->sink = sink;
+ writer->stream = stream;
+ return writer;
+}
+
+SERD_API
+void
+serd_writer_set_base_uri(SerdWriter writer,
+ const SerdURI* uri)
+{
+ writer->base_uri = *uri;
+}
+
+SERD_API
+void
+serd_writer_free(SerdWriter writer)
+{
+ SerdWriter const me = (SerdWriter)writer;
+ free(me);
+}