/* Copyright 2011-2020 David Robillard Permission to use, copy, modify, and/or distribute this software for any purpose with or without fee is hereby granted, provided that the above copyright notice and this permission notice appear in all copies. THIS SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ #undef NDEBUG #include "serd/serd.h" #include #include #include #include #include #include #define NS_XSD "http://www.w3.org/2001/XMLSchema#" static SerdStatus count_statements(void* handle, const SerdEvent* event) { if (event->type == SERD_STATEMENT) { ++*(size_t*)handle; } return SERD_SUCCESS; } /// Returns EOF after a statement, then succeeds again (like a socket) static size_t eof_test_read(void* buf, size_t size, size_t nmemb, void* stream) { assert(nmemb == 1); static const char* const string = "_:s1 _:o1 .\n" "_:s2 _:o2 .\n"; size_t* count = (size_t*)stream; if (*count == 34 || *count == 35 || *count + nmemb >= strlen(string)) { ++*count; return 0; } memcpy((char*)buf, string + *count, size * nmemb); *count += nmemb; return nmemb; } static int eof_test_error(void* stream) { (void)stream; return 0; } static void test_file_uri(const char* hostname, const char* path, const char* expected_uri, const char* expected_path) { if (!expected_path) { expected_path = path; } SerdNode* node = serd_new_file_uri(path, hostname); const char* node_str = serd_node_string(node); char* out_hostname = NULL; char* out_path = serd_file_uri_parse(node_str, &out_hostname); assert(!strcmp(node_str, expected_uri)); assert((hostname && out_hostname) || (!hostname && !out_hostname)); assert(!strcmp(out_path, expected_path)); serd_free(out_path); serd_free(out_hostname); serd_node_free(node); } static void test_read_chunks(void) { SerdWorld* world = serd_world_new(); size_t n_statements = 0; FILE* const f = tmpfile(); static const char null = 0; SerdSink* sink = serd_sink_new(&n_statements, NULL); assert(sink); serd_sink_set_event_func(sink, count_statements); SerdReader* reader = serd_reader_new(world, SERD_TURTLE, 0, sink, 4096); assert(reader); assert(f); SerdStatus st = serd_reader_start_stream(reader, (SerdReadFunc)fread, (SerdStreamErrorFunc)ferror, f, NULL, 1); assert(st == SERD_SUCCESS); // Write two statement separated by null characters fprintf(f, "@prefix eg: .\n"); fprintf(f, "eg:s eg:p eg:o1 .\n"); fwrite(&null, sizeof(null), 1, f); fprintf(f, "eg:s eg:p eg:o2 .\n"); fwrite(&null, sizeof(null), 1, f); fseek(f, 0, SEEK_SET); // Read prefix st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(n_statements == 0); // Read first statement st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(n_statements == 1); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(n_statements == 1); // Read second statement (after null terminator) st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(n_statements == 2); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(n_statements == 2); // EOF st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(n_statements == 2); serd_reader_free(reader); serd_sink_free(sink); fclose(f); serd_world_free(world); } static int test_get_blank(void) { SerdWorld* world = serd_world_new(); char expected[8]; for (unsigned i = 0; i < 32; ++i) { const SerdNode* blank = serd_world_get_blank(world); snprintf(expected, sizeof(expected), "b%u", i + 1); assert(!strcmp(serd_node_string(blank), expected)); } serd_world_free(world); return 0; } static int test_strict_write(void) { SerdWorld* world = serd_world_new(); const char* path = "serd_strict_write_test.ttl"; FILE* fd = fopen(path, "wb"); SerdEnv* env = serd_env_new(NULL); SerdWriter* writer = serd_writer_new(world, SERD_TURTLE, 0, env, (SerdWriteFunc)fwrite, fd); assert(fd); assert(writer); const SerdSink* sink = serd_writer_get_sink(writer); const uint8_t bad_str[] = {0xFF, 0x90, 'h', 'i', 0}; SerdNode* s = serd_new_uri("http://example.org/s"); SerdNode* p = serd_new_uri("http://example.org/s"); SerdNode* bad_lit = serd_new_string((const char*)bad_str); SerdNode* bad_uri = serd_new_uri((const char*)bad_str); assert(serd_sink_write(sink, 0, s, p, bad_lit, 0) == SERD_ERR_INVALID); assert(serd_sink_write(sink, 0, s, p, bad_uri, 0) == SERD_ERR_INVALID); serd_node_free(bad_uri); serd_node_free(bad_lit); serd_node_free(s); serd_node_free(p); serd_writer_free(writer); serd_env_free(env); fclose(fd); serd_world_free(world); return 0; } static void test_read_string(void) { SerdWorld* world = serd_world_new(); size_t n_statements = 0; SerdSink* sink = serd_sink_new(&n_statements, NULL); SerdReader* reader = serd_reader_new(world, SERD_TURTLE, 0, sink, 4096); assert(reader); serd_sink_set_event_func(sink, count_statements); // Test reading a string that ends exactly at the end of input (no newline) assert(!serd_reader_start_string( reader, " " " .", NULL)); assert(!serd_reader_read_document(reader)); assert(n_statements == 1); assert(!serd_reader_finish(reader)); serd_reader_free(reader); serd_sink_free(sink); serd_world_free(world); } static void test_integer_to_node(void) { const long int_test_nums[] = { 0, -0, -23, 23, -12340, 1000, -1000 }; const char* int_test_strs[] = { "0", "0", "-23", "23", "-12340", "1000", "-1000" }; for (size_t i = 0; i < sizeof(int_test_nums) / sizeof(double); ++i) { SerdNode* node = serd_new_integer(int_test_nums[i], NULL); const char* node_str = serd_node_string(node); assert(!strcmp(node_str, int_test_strs[i])); const size_t len = strlen(node_str); assert(serd_node_length(node) == len); assert(!strcmp(serd_node_string(serd_node_datatype(node)), NS_XSD "integer")); serd_node_free(node); } } static void test_boolean(void) { SerdNode* true_node = serd_new_boolean(true); assert(!strcmp(serd_node_string(true_node), "true")); assert(!strcmp(serd_node_string(serd_node_datatype(true_node)), NS_XSD "boolean")); serd_node_free(true_node); SerdNode* false_node = serd_new_boolean(false); assert(!strcmp(serd_node_string(false_node), "false")); assert(!strcmp(serd_node_string(serd_node_datatype(false_node)), NS_XSD "boolean")); serd_node_free(false_node); } static void test_blob_to_node(void) { assert(!serd_new_blob(NULL, 0, true, NULL)); assert(!serd_new_blob("data", 0, true, NULL)); for (size_t size = 1; size < 256; ++size) { uint8_t* data = size > 0 ? (uint8_t*)malloc(size) : NULL; for (size_t i = 0; i < size; ++i) { data[i] = (uint8_t)((size + i) % 256); } size_t out_size = 0; SerdNode* blob = serd_new_blob(data, size, size % 5, NULL); const char* blob_str = serd_node_string(blob); const size_t len = serd_node_length(blob); uint8_t* out = (uint8_t*)malloc(serd_base64_decoded_size(len)); assert(!serd_base64_decode(out, &out_size, blob_str, len)); assert(serd_node_length(blob) == strlen(blob_str)); assert(out_size == size); for (size_t i = 0; i < size; ++i) { assert(out[i] == data[i]); } assert(!strcmp(serd_node_string(serd_node_datatype(blob)), NS_XSD "base64Binary")); serd_node_free(blob); free(out); free(data); } } static void test_strlen(void) { const uint8_t str[] = { '"', '5', 0xE2, 0x82, 0xAC, '"', '\n', 0 }; SerdNodeFlags flags = 0; size_t n_bytes = serd_strlen((const char*)str, &flags); assert(n_bytes == 7 && flags == (SERD_HAS_QUOTE|SERD_HAS_NEWLINE)); assert(serd_strlen((const char*)str, NULL) == 7); } static void test_strerror(void) { const char* msg = serd_strerror(SERD_SUCCESS); assert(!strcmp(msg, "Success")); for (int i = SERD_FAILURE; i <= SERD_ERR_BAD_WRITE; ++i) { msg = serd_strerror((SerdStatus)i); assert(strcmp(msg, "Success")); } msg = serd_strerror((SerdStatus)-1); assert(!strcmp(msg, "Unknown error")); } static void test_uri_parsing(void) { test_file_uri(NULL, "C:/My 100%", "file:///C:/My%20100%%", NULL); test_file_uri("ahost", "C:\\Pointless Space", "file://ahost/C:/Pointless%20Space", "C:/Pointless Space"); test_file_uri(NULL, "/foo/bar", "file:///foo/bar", NULL); test_file_uri("bhost", "/foo/bar", "file://bhost/foo/bar", NULL); test_file_uri(NULL, "a/relative ", "a/relative%20%3Cpath%3E", NULL); // Test tolerance of parsing junk URI escapes char* out_path = serd_file_uri_parse("file:///foo/%0Xbar", NULL); assert(!strcmp(out_path, "/foo/bar")); serd_free(out_path); } static void test_node_equals(void) { const uint8_t replacement_char_str[] = { 0xEF, 0xBF, 0xBD, 0 }; SerdNode* lhs = serd_new_string((const char*)replacement_char_str); SerdNode* rhs = serd_new_string("123"); assert(!serd_node_equals(lhs, rhs)); SerdNode* qnode = serd_new_curie("foo:bar"); assert(!serd_node_equals(lhs, qnode)); serd_node_free(qnode); assert(!serd_node_copy(NULL)); serd_node_free(lhs); serd_node_free(rhs); } static void test_node_from_string(void) { assert(!serd_new_string(NULL)); SerdNode* hello = serd_new_string("hello\""); assert(serd_node_length(hello) == 6); assert(serd_node_flags(hello) == SERD_HAS_QUOTE); assert(!strncmp(serd_node_string(hello), "hello\"", 6)); serd_node_free(hello); } static void test_node_from_substring(void) { assert(!serd_new_substring(NULL, 32)); SerdNode* a_b = serd_new_substring("a\"bc", 3); assert(serd_node_length(a_b) == 3); assert(serd_node_flags(a_b) == SERD_HAS_QUOTE); assert(strlen(serd_node_string(a_b)) == 3); assert(!strncmp(serd_node_string(a_b), "a\"b", 3)); serd_node_free(a_b); a_b = serd_new_substring("a\"bc", 10); assert(serd_node_length(a_b) == 4); assert(serd_node_flags(a_b) == SERD_HAS_QUOTE); assert(strlen(serd_node_string(a_b)) == 4); assert(!strncmp(serd_node_string(a_b), "a\"bc", 4)); serd_node_free(a_b); } static void test_simple_node(void) { assert(!serd_new_simple_node(SERD_LITERAL, "Literal", 7)); assert(!serd_new_simple_node(SERD_URI, NULL, 0)); } static void test_literal(void) { assert(!serd_new_literal(NULL, 0, NULL, 0, NULL, 0)); assert(!serd_new_plain_literal(NULL, NULL)); assert(!serd_new_typed_literal(NULL, NULL)); SerdNode* hello2 = serd_new_string("hello\""); assert(!serd_new_typed_literal("bad type", hello2)); assert(serd_node_length(hello2) == 6 && serd_node_flags(hello2) == SERD_HAS_QUOTE && !strcmp(serd_node_string(hello2), "hello\"")); SerdNode* hello3 = serd_new_plain_literal("hello\"", NULL); assert(serd_node_equals(hello2, hello3)); SerdNode* hello4 = serd_new_typed_literal("hello\"", NULL); assert(serd_node_equals(hello4, hello2)); serd_node_free(hello4); serd_node_free(hello3); serd_node_free(hello2); const char* lang_lit_str = "\"Hello\"@en"; SerdNode* sliced_lang_lit = serd_new_literal(lang_lit_str + 1, 5, NULL, 0, lang_lit_str + 8, 2); assert(!strcmp(serd_node_string(sliced_lang_lit), "Hello")); assert(!strcmp( serd_node_string(serd_node_language(sliced_lang_lit)), "en")); serd_node_free(sliced_lang_lit); const char* type_lit_str = "\"Hallo\"^^"; SerdNode* sliced_type_lit = serd_new_literal(type_lit_str + 1, 5, type_lit_str + 10, 27, NULL, 0); assert(!strcmp(serd_node_string(sliced_type_lit), "Hallo")); assert(!strcmp( serd_node_string(serd_node_datatype(sliced_type_lit)), "http://example.org/Greeting")); serd_node_free(sliced_type_lit); SerdNode* plain_lit = serd_new_literal("Plain", 5, NULL, 0, NULL, 0); assert(!strcmp(serd_node_string(plain_lit), "Plain")); serd_node_free(plain_lit); } static void test_uri_from_string(void) { assert(!serd_new_uri(NULL)); SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); SerdNode* not_a_uri = serd_new_string("hello"); SerdNode* nil = serd_new_resolved_uri(NULL, base); SerdNode* nil2 = serd_new_resolved_uri("", base); assert(!serd_new_resolved_uri("", NULL)); assert(!serd_new_resolved_uri("", not_a_uri)); assert(serd_node_type(nil) == SERD_URI); assert(!strcmp(serd_node_string(nil), serd_node_string(base))); assert(serd_node_type(nil2) == SERD_URI); assert(!strcmp(serd_node_string(nil2), serd_node_string(base))); serd_node_free(nil2); serd_node_free(nil); serd_node_free(not_a_uri); serd_node_free(base); } static void check_rel_uri(const char* uri, const SerdNode* base, const SerdNode* root, const char* expected) { SerdNode* rel = serd_new_relative_uri(uri, base, root); const int ret = strcmp(serd_node_string(rel), expected); serd_node_free(rel); assert(!ret); } static void test_relative_uri(void) { SerdNode* root = serd_new_uri("http://example.org/a/b/ignored"); SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); check_rel_uri("http://example.org/a/b/c/foo", base, NULL, "foo"); check_rel_uri("http://example.org/a/", base, NULL, "../../"); check_rel_uri("http://example.org/a/", base, root, "http://example.org/a/"); check_rel_uri("http://example.org/a/b/x", root, root, "x"); check_rel_uri("http://example.org/", base, NULL, "../../../"); check_rel_uri("http://drobilla.net/a", base, NULL, "http://drobilla.net/a"); serd_node_free(base); serd_node_free(root); } static void test_uri_resolution(void) { SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); SerdNode* nil = serd_new_resolved_uri(NULL, base); SerdNode* nil2 = serd_new_resolved_uri("", base); SerdNode* not_a_uri = serd_new_string("hello"); SerdNode* root = serd_new_uri("http://example.org/a/b/"); assert(!serd_node_resolve(NULL, base)); assert(!serd_node_resolve(nil, NULL)); assert(!serd_node_resolve(not_a_uri, base)); assert(!serd_node_resolve(nil, not_a_uri)); SerdNode* rel = serd_new_relative_uri( "http://example.org/a/b/c/foo", base, NULL); SerdNode* resolved = serd_node_resolve(rel, base); assert(!strcmp(serd_node_string(resolved), "http://example.org/a/b/c/foo")); serd_node_free(nil); serd_node_free(nil2); serd_node_free(not_a_uri); serd_node_free(resolved); serd_node_free(rel); serd_node_free(base); serd_node_free(root); } static void test_blank(void) { assert(!serd_new_blank(NULL)); SerdNode* blank = serd_new_blank("b0"); assert(serd_node_length(blank) == 2); assert(serd_node_flags(blank) == 0); assert(!strcmp(serd_node_string(blank), "b0")); serd_node_free(blank); } static void test_writer(const char* const path) { FILE* fd = fopen(path, "wb"); SerdEnv* env = serd_env_new(NULL); assert(fd); SerdWorld* world = serd_world_new(); SerdWriter* writer = serd_writer_new(world, SERD_TURTLE, SERD_WRITE_LAX, env, (SerdWriteFunc)fwrite, fd); assert(writer); serd_writer_chop_blank_prefix(writer, "tmp"); serd_writer_chop_blank_prefix(writer, NULL); SerdNode* lit = serd_new_string("hello"); const SerdSink* iface = serd_writer_get_sink(writer); assert(serd_sink_write_base(iface, lit)); assert(serd_sink_write_prefix(iface, lit, lit)); assert(serd_sink_write_end(iface, NULL)); assert(serd_writer_env(writer) == env); uint8_t buf[] = { 0xEF, 0xBF, 0xBD, 0 }; SerdNode* s = serd_new_uri(""); SerdNode* p = serd_new_uri("http://example.org/pred"); SerdNode* o = serd_new_string((char*)buf); // Write 3 invalid statements (should write nothing) const SerdNode* junk[][5] = { { s, p, NULL }, { s, NULL, o }, { NULL, p, o }, { s, p, NULL }, { s, NULL, o }, { NULL, p, o }, { s, o, o }, { o, p, o }, { s, p, NULL }, { NULL, NULL, NULL } }; for (size_t i = 0; i < sizeof(junk) / (sizeof(SerdNode*) * 5); ++i) { assert(serd_sink_write( iface, 0, junk[i][0], junk[i][1], junk[i][2], 0)); } SerdNode* urn_Type = serd_new_uri("urn:Type"); SerdNode* t = serd_new_typed_literal((char*)buf, urn_Type); SerdNode* l = serd_new_plain_literal((char*)buf, "en"); const SerdNode* good[][5] = { { s, p, o }, { s, p, o }, { s, p, t }, { s, p, l }, { s, p, l }, { s, p, t }, { s, p, l }, { s, p, o }, { s, p, o }, { s, p, o } }; for (size_t i = 0; i < sizeof(good) / (sizeof(SerdNode*) * 5); ++i) { assert(!serd_sink_write( iface, 0, good[i][0], good[i][1], good[i][2], 0)); } // Write statements with bad UTF-8 (should be replaced) const uint8_t bad_str[] = { 0xFF, 0x90, 'h', 'i', 0 }; SerdNode* bad_lit = serd_new_string((const char*)bad_str); SerdNode* bad_uri = serd_new_uri((const char*)bad_str); assert(!serd_sink_write(iface, 0, s, p, bad_lit, 0)); assert(!serd_sink_write(iface, 0, s, p, bad_uri, 0)); serd_node_free(bad_uri); serd_node_free(bad_lit); // Write 1 valid statement serd_node_free(o); o = serd_new_string("hello"); assert(!serd_sink_write(iface, 0, s, p, o, 0)); serd_writer_free(writer); serd_node_free(lit); serd_node_free(o); serd_node_free(t); serd_node_free(l); serd_node_free(urn_Type); // Test buffer sink SerdBuffer buffer = { NULL, 0 }; SerdByteSink* byte_sink = serd_byte_sink_new((SerdWriteFunc)serd_buffer_sink, &buffer, 1); writer = serd_writer_new(world, SERD_TURTLE, 0, env, (SerdWriteFunc)serd_byte_sink_write, byte_sink); o = serd_new_uri("http://example.org/base"); assert(!serd_writer_set_base_uri(writer, o)); serd_node_free(o); serd_writer_free(writer); serd_byte_sink_free(byte_sink); char* out = serd_buffer_sink_finish(&buffer); assert(!strcmp(out, "@base .\n")); serd_free(out); serd_env_free(env); serd_world_free(world); fclose(fd); } static void test_reader(const char* path) { SerdWorld* world = serd_world_new(); size_t n_statements = 0; SerdSink* sink = serd_sink_new(&n_statements, NULL); serd_sink_set_event_func(sink, count_statements); SerdReader* reader = serd_reader_new(world, SERD_TURTLE, 0, sink, 4096); assert(reader); assert(serd_reader_read_document(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); serd_reader_add_blank_prefix(reader, "tmp"); serd_reader_add_blank_prefix(reader, NULL); assert(serd_reader_start_file(reader, "http://notafile", false)); assert(serd_reader_start_file(reader, "file://invalid", false)); assert(serd_reader_start_file(reader, "file:///nonexistant", false)); assert(!serd_reader_start_file(reader, path, true)); assert(!serd_reader_read_document(reader)); assert(n_statements == 13); serd_reader_finish(reader); // A read of a big page hits EOF then fails to read chunks immediately { FILE* temp = tmpfile(); assert(temp); fprintf(temp, "_:s _:o .\n"); fflush(temp); fseek(temp, 0L, SEEK_SET); serd_reader_start_stream(reader, (SerdReadFunc)fread, (SerdStreamErrorFunc)ferror, temp, NULL, 4096); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); serd_reader_finish(reader); fclose(temp); } // A byte-wise reader that hits EOF once then continues (like a socket) { size_t n_reads = 0; serd_reader_start_stream(reader, (SerdReadFunc)eof_test_read, (SerdStreamErrorFunc)eof_test_error, &n_reads, NULL, 1); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); } serd_reader_free(reader); serd_sink_free(sink); serd_world_free(world); } int main(void) { test_integer_to_node(); test_blob_to_node(); test_boolean(); test_strlen(); test_strerror(); test_uri_parsing(); test_node_equals(); test_node_from_string(); test_node_from_substring(); test_simple_node(); test_literal(); test_uri_from_string(); test_relative_uri(); test_uri_resolution(); test_blank(); test_read_chunks(); test_read_string(); test_get_blank(); test_strict_write(); const char* const path = "serd_test.ttl"; test_writer(path); test_reader(path); printf("Success\n"); return 0; }