/* Copyright 2011-2020 David Robillard Permission to use, copy, modify, and/or distribute this software for any purpose with or without fee is hereby granted, provided that the above copyright notice and this permission notice appear in all copies. THIS SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ #undef NDEBUG #include "serd/serd.h" #include #include #include #include #include #include #include #include #ifndef INFINITY # define INFINITY (DBL_MAX + DBL_MAX) #endif #ifndef NAN # define NAN (INFINITY - INFINITY) #endif #define NS_XSD "http://www.w3.org/2001/XMLSchema#" static void test_strtod(double dbl, double max_delta) { char buf[1024]; snprintf(buf, sizeof(buf), "%f", dbl); size_t end = 0; const double out = serd_strtod(buf, &end); const double diff = fabs(out - dbl); assert(diff <= max_delta); assert(end == strlen(buf)); } typedef struct { int n_statements; const SerdNode* graph; } ReaderTest; static SerdStatus test_sink(void* handle, SerdStatementFlags flags, const SerdStatement* statement) { (void)flags; (void)statement; ReaderTest* rt = (ReaderTest*)handle; ++rt->n_statements; rt->graph = serd_statement_graph(statement); return SERD_SUCCESS; } /// Returns EOF after a statement, then succeeds again (like a socket) static size_t eof_test_read(void* buf, size_t size, size_t nmemb, void* stream) { assert(nmemb == 1); static const char* const string = "_:s1 _:o1 .\n" "_:s2 _:o2 .\n"; size_t* count = (size_t*)stream; if (*count == 34 || *count == 35 || *count + nmemb >= strlen(string)) { ++*count; return 0; } memcpy((char*)buf, string + *count, size * nmemb); *count += nmemb; return nmemb; } static int eof_test_error(void* stream) { (void)stream; return 0; } static void test_file_uri(const char* hostname, const char* path, const char* expected_uri, const char* expected_path) { if (!expected_path) { expected_path = path; } SerdNode* node = serd_new_file_uri(path, hostname); const char* node_str = serd_node_string(node); char* out_hostname = NULL; char* out_path = serd_file_uri_parse(node_str, &out_hostname); assert(!strcmp(node_str, expected_uri)); assert((hostname && out_hostname) || (!hostname && !out_hostname)); assert(!strcmp(out_path, expected_path)); serd_free(out_path); serd_free(out_hostname); serd_node_free(node); } static void test_read_chunks(void) { SerdWorld* world = serd_world_new(); ReaderTest* const rt = (ReaderTest*)calloc(1, sizeof(ReaderTest)); FILE* const f = tmpfile(); static const char null = 0; SerdSink sink = {rt, NULL, NULL, test_sink, NULL}; SerdReader* reader = serd_reader_new(world, SERD_TURTLE, &sink, 4096); assert(reader); assert(f); SerdStatus st = serd_reader_start_stream(reader, (SerdReadFunc)fread, (SerdStreamErrorFunc)ferror, f, NULL, 1); assert(st == SERD_SUCCESS); // Write two statement separated by null characters fprintf(f, "@prefix eg: .\n"); fprintf(f, "eg:s eg:p eg:o1 .\n"); fwrite(&null, sizeof(null), 1, f); fprintf(f, "eg:s eg:p eg:o2 .\n"); fwrite(&null, sizeof(null), 1, f); fseek(f, 0, SEEK_SET); // Read prefix st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt->n_statements == 0); // Read first statement st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt->n_statements == 1); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt->n_statements == 1); // Read second statement (after null terminator) st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt->n_statements == 2); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt->n_statements == 2); // EOF st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt->n_statements == 2); serd_reader_free(reader); fclose(f); free(rt); serd_world_free(world); } static int test_get_blank(void) { SerdWorld* world = serd_world_new(); char expected[8]; for (unsigned i = 0; i < 32; ++i) { const SerdNode* blank = serd_world_get_blank(world); snprintf(expected, sizeof(expected), "b%u", i + 1); assert(!strcmp(serd_node_string(blank), expected)); } serd_world_free(world); return 0; } static void test_read_string(void) { SerdWorld* world = serd_world_new(); ReaderTest* rt = (ReaderTest*)calloc(1, sizeof(ReaderTest)); SerdSink sink = {rt, NULL, NULL, test_sink, NULL}; SerdReader* reader = serd_reader_new(world, SERD_TURTLE, &sink, 4096); assert(reader); // Test reading a string that ends exactly at the end of input (no newline) assert(!serd_reader_start_string( reader, " " " .", NULL)); assert(!serd_reader_read_document(reader)); assert(rt->n_statements == 1); assert(!serd_reader_finish(reader)); serd_reader_free(reader); serd_world_free(world); } static void test_string_to_double(void) { size_t end = 0; assert(isnan(serd_strtod("NaN", &end))); assert(end == 3); assert(isinf(serd_strtod("INF", &end)) == 1); assert(end == 3); assert(isinf(serd_strtod("-INF", &end)) == -1); assert(end == 4); const double expt_test_nums[] = { 2.0E18, -5e19, +8e20, 2e+24, -5e-5, 8e0, 9e-0, 2e+0 }; const char* expt_test_strs[] = { "02e18", "-5e019", "+8e20", "2E+24", "-5E-5", "8E0", "9e-0", " 2e+0" }; for (size_t i = 0; i < sizeof(expt_test_nums) / sizeof(double); ++i) { const double num = serd_strtod(expt_test_strs[i], NULL); const double delta = fabs(num - expt_test_nums[i]); assert(delta <= DBL_EPSILON); test_strtod(expt_test_nums[i], DBL_EPSILON); } } static void test_double_to_node(void) { const double dbl_test_nums[] = { 0.0, 9.0, 10.0, .01, 2.05, -16.00001, 5.000000005, 0.0000000001, NAN, INFINITY }; const char* dbl_test_strs[] = { "0.0", "9.0", "10.0", "0.01", "2.05", "-16.00001", "5.00000001", "0.0", NULL, NULL }; for (size_t i = 0; i < sizeof(dbl_test_nums) / sizeof(double); ++i) { SerdNode* node = serd_new_decimal(dbl_test_nums[i], 8, NULL); const char* node_str = serd_node_string(node); const bool pass = (node_str && dbl_test_strs[i]) ? !strcmp(node_str, dbl_test_strs[i]) : (node_str == dbl_test_strs[i]); assert(pass); const size_t len = node_str ? strlen(node_str) : 0; assert(serd_node_length(node) == len); assert(!dbl_test_strs[i] || !strcmp(serd_node_string(serd_node_datatype(node)), NS_XSD "decimal")); serd_node_free(node); } } static void test_integer_to_node(void) { const long int_test_nums[] = { 0, -0, -23, 23, -12340, 1000, -1000 }; const char* int_test_strs[] = { "0", "0", "-23", "23", "-12340", "1000", "-1000" }; for (size_t i = 0; i < sizeof(int_test_nums) / sizeof(double); ++i) { SerdNode* node = serd_new_integer(int_test_nums[i], NULL); const char* node_str = serd_node_string(node); assert(!strcmp(node_str, int_test_strs[i])); const size_t len = strlen(node_str); assert(serd_node_length(node) == len); assert(!strcmp(serd_node_string(serd_node_datatype(node)), NS_XSD "integer")); serd_node_free(node); } } static void test_blob_to_node(void) { assert(!serd_new_blob(NULL, 0, true, NULL)); assert(!serd_new_blob("data", 0, true, NULL)); for (size_t size = 1; size < 256; ++size) { uint8_t* data = size > 0 ? (uint8_t*)malloc(size) : NULL; for (size_t i = 0; i < size; ++i) { data[i] = (uint8_t)((size + i) % 256); } size_t out_size = 0; SerdNode* blob = serd_new_blob(data, size, size % 5, NULL); const char* blob_str = serd_node_string(blob); uint8_t* out = (uint8_t*)serd_base64_decode( blob_str, serd_node_length(blob), &out_size); assert(serd_node_length(blob) == strlen(blob_str)); assert(out_size == size); for (size_t i = 0; i < size; ++i) { assert(out[i] == data[i]); } assert(!strcmp(serd_node_string(serd_node_datatype(blob)), NS_XSD "base64Binary")); serd_node_free(blob); serd_free(out); free(data); } } static void test_strlen(void) { const uint8_t str[] = { '"', '5', 0xE2, 0x82, 0xAC, '"', '\n', 0 }; SerdNodeFlags flags = 0; size_t n_bytes = serd_strlen((const char*)str, &flags); assert(n_bytes == 7 && flags == (SERD_HAS_QUOTE|SERD_HAS_NEWLINE)); assert(serd_strlen((const char*)str, NULL) == 7); } static void test_strerror(void) { const char* msg = serd_strerror(SERD_SUCCESS); assert(!strcmp(msg, "Success")); for (int i = SERD_FAILURE; i <= SERD_ERR_OVERFLOW; ++i) { msg = serd_strerror((SerdStatus)i); assert(strcmp(msg, "Success")); } msg = serd_strerror((SerdStatus)-1); assert(!strcmp(msg, "Unknown error")); } static void test_uri_parsing(void) { test_file_uri(NULL, "C:/My 100%", "file:///C:/My%20100%%", NULL); test_file_uri("ahost", "C:\\Pointless Space", "file://ahost/C:/Pointless%20Space", "C:/Pointless Space"); test_file_uri(NULL, "/foo/bar", "file:///foo/bar", NULL); test_file_uri("bhost", "/foo/bar", "file://bhost/foo/bar", NULL); test_file_uri(NULL, "a/relative ", "a/relative%20%3Cpath%3E", NULL); // Test tolerance of parsing junk URI escapes char* out_path = serd_file_uri_parse("file:///foo/%0Xbar", NULL); assert(!strcmp(out_path, "/foo/bar")); serd_free(out_path); } static void test_node_equals(void) { const uint8_t replacement_char_str[] = { 0xEF, 0xBF, 0xBD, 0 }; SerdNode* lhs = serd_new_string((const char*)replacement_char_str); SerdNode* rhs = serd_new_string("123"); assert(!serd_node_equals(lhs, rhs)); SerdNode* qnode = serd_new_curie("foo:bar"); assert(!serd_node_equals(lhs, qnode)); serd_node_free(qnode); assert(!serd_node_copy(NULL)); serd_node_free(lhs); serd_node_free(rhs); } static void test_node_from_string(void) { assert(!serd_new_string(NULL)); SerdNode* hello = serd_new_string("hello\""); assert(serd_node_length(hello) == 6); assert(serd_node_flags(hello) == SERD_HAS_QUOTE); assert(!strncmp(serd_node_string(hello), "hello\"", 6)); serd_node_free(hello); } static void test_node_from_substring(void) { assert(!serd_new_substring(NULL, 32)); SerdNode* a_b = serd_new_substring("a\"bc", 3); assert(serd_node_length(a_b) == 3); assert(serd_node_flags(a_b) == SERD_HAS_QUOTE); assert(strlen(serd_node_string(a_b)) == 3); assert(!strncmp(serd_node_string(a_b), "a\"b", 3)); serd_node_free(a_b); a_b = serd_new_substring("a\"bc", 10); assert(serd_node_length(a_b) == 4); assert(serd_node_flags(a_b) == SERD_HAS_QUOTE); assert(strlen(serd_node_string(a_b)) == 4); assert(!strncmp(serd_node_string(a_b), "a\"bc", 4)); serd_node_free(a_b); } static void test_simple_node(void) { assert(!serd_new_simple_node(SERD_LITERAL, "Literal", 7)); assert(!serd_new_simple_node(SERD_URI, NULL, 0)); } static void test_literal(void) { assert(!serd_new_literal(NULL, 0, NULL, 0, NULL, 0)); assert(!serd_new_plain_literal(NULL, NULL)); assert(!serd_new_typed_literal(NULL, NULL)); SerdNode* hello2 = serd_new_string("hello\""); assert(!serd_new_typed_literal("bad type", hello2)); assert(serd_node_length(hello2) == 6 && serd_node_flags(hello2) == SERD_HAS_QUOTE && !strcmp(serd_node_string(hello2), "hello\"")); SerdNode* hello3 = serd_new_plain_literal("hello\"", NULL); assert(serd_node_equals(hello2, hello3)); SerdNode* hello4 = serd_new_typed_literal("hello\"", NULL); assert(serd_node_equals(hello4, hello2)); serd_node_free(hello4); serd_node_free(hello3); serd_node_free(hello2); const char* lang_lit_str = "\"Hello\"@en"; SerdNode* sliced_lang_lit = serd_new_literal(lang_lit_str + 1, 5, NULL, 0, lang_lit_str + 8, 2); assert(!strcmp(serd_node_string(sliced_lang_lit), "Hello")); assert(!strcmp( serd_node_string(serd_node_language(sliced_lang_lit)), "en")); serd_node_free(sliced_lang_lit); const char* type_lit_str = "\"Hallo\"^^"; SerdNode* sliced_type_lit = serd_new_literal(type_lit_str + 1, 5, type_lit_str + 10, 27, NULL, 0); assert(!strcmp(serd_node_string(sliced_type_lit), "Hallo")); assert(!strcmp( serd_node_string(serd_node_datatype(sliced_type_lit)), "http://example.org/Greeting")); serd_node_free(sliced_type_lit); SerdNode* plain_lit = serd_new_literal("Plain", 5, NULL, 0, NULL, 0); assert(!strcmp(serd_node_string(plain_lit), "Plain")); serd_node_free(plain_lit); } static void test_uri_from_string(void) { assert(!serd_new_uri(NULL)); SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); SerdNode* not_a_uri = serd_new_string("hello"); SerdNode* nil = serd_new_resolved_uri(NULL, base); SerdNode* nil2 = serd_new_resolved_uri("", base); assert(!serd_new_resolved_uri("", NULL)); assert(!serd_new_resolved_uri("", not_a_uri)); assert(serd_node_type(nil) == SERD_URI); assert(!strcmp(serd_node_string(nil), serd_node_string(base))); assert(serd_node_type(nil2) == SERD_URI); assert(!strcmp(serd_node_string(nil2), serd_node_string(base))); serd_node_free(nil2); serd_node_free(nil); serd_node_free(not_a_uri); serd_node_free(base); } static void check_rel_uri(const char* uri, const SerdNode* base, const SerdNode* root, const char* expected) { SerdNode* rel = serd_new_relative_uri(uri, base, root); const int ret = strcmp(serd_node_string(rel), expected); serd_node_free(rel); assert(!ret); } static void test_relative_uri(void) { SerdNode* root = serd_new_uri("http://example.org/a/b/"); SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); check_rel_uri("http://example.org/a/b/c/foo", base, NULL, "foo"); check_rel_uri("http://example.org/a/", base, NULL, "../../"); check_rel_uri("http://example.org/a/", base, root, "http://example.org/a/"); check_rel_uri("http://example.org/", base, NULL, "../../../"); check_rel_uri("http://drobilla.net/a", base, NULL, "http://drobilla.net/a"); serd_node_free(base); serd_node_free(root); } static void test_uri_resolution(void) { SerdNode* base = serd_new_uri("http://example.org/a/b/c/"); SerdNode* nil = serd_new_resolved_uri(NULL, base); SerdNode* nil2 = serd_new_resolved_uri("", base); SerdNode* not_a_uri = serd_new_string("hello"); SerdNode* root = serd_new_uri("http://example.org/a/b/"); assert(!serd_node_resolve(NULL, base)); assert(!serd_node_resolve(nil, NULL)); assert(!serd_node_resolve(not_a_uri, base)); assert(!serd_node_resolve(nil, not_a_uri)); SerdNode* rel = serd_new_relative_uri( "http://example.org/a/b/c/foo", base, NULL); SerdNode* resolved = serd_node_resolve(rel, base); assert(!strcmp(serd_node_string(resolved), "http://example.org/a/b/c/foo")); serd_node_free(nil); serd_node_free(nil2); serd_node_free(not_a_uri); serd_node_free(resolved); serd_node_free(rel); serd_node_free(base); serd_node_free(root); } static void test_blank(void) { assert(!serd_new_blank(NULL)); SerdNode* blank = serd_new_blank("b0"); assert(serd_node_length(blank) == 2); assert(serd_node_flags(blank) == 0); assert(!strcmp(serd_node_string(blank), "b0")); serd_node_free(blank); } static void test_writer(const char* const path) { FILE* fd = fopen(path, "wb"); SerdEnv* env = serd_env_new(NULL); assert(fd); SerdWorld* world = serd_world_new(); SerdWriter* writer = serd_writer_new(world, SERD_TURTLE, (SerdStyle)0, env, (SerdWriteFunc)fwrite, fd); assert(writer); serd_writer_chop_blank_prefix(writer, "tmp"); serd_writer_chop_blank_prefix(writer, NULL); SerdNode* lit = serd_new_string("hello"); const SerdSink* iface = serd_writer_get_sink(writer); assert(iface->base(iface->handle, lit)); assert(iface->prefix(iface->handle, lit, lit)); assert(iface->end(iface->handle, NULL)); assert(serd_writer_env(writer) == env); uint8_t buf[] = { 0xEF, 0xBF, 0xBD, 0 }; SerdNode* s = serd_new_uri(""); SerdNode* p = serd_new_uri("http://example.org/pred"); SerdNode* o = serd_new_string((char*)buf); // Write 3 invalid statements (should write nothing) const SerdNode* junk[][5] = { { s, p, NULL }, { s, NULL, o }, { NULL, p, o }, { s, p, NULL }, { s, NULL, o }, { NULL, p, o }, { s, o, o }, { o, p, o }, { s, p, NULL }, { NULL, NULL, NULL } }; for (size_t i = 0; i < sizeof(junk) / (sizeof(SerdNode*) * 5); ++i) { assert(serd_sink_write( iface, 0, junk[i][0], junk[i][1], junk[i][2], 0)); } SerdNode* urn_Type = serd_new_uri("urn:Type"); SerdNode* t = serd_new_typed_literal((char*)buf, urn_Type); SerdNode* l = serd_new_plain_literal((char*)buf, "en"); const SerdNode* good[][5] = { { s, p, o }, { s, p, o }, { s, p, t }, { s, p, l }, { s, p, l }, { s, p, t }, { s, p, l }, { s, p, o }, { s, p, o }, { s, p, o } }; for (size_t i = 0; i < sizeof(good) / (sizeof(SerdNode*) * 5); ++i) { assert(!serd_sink_write( iface, 0, good[i][0], good[i][1], good[i][2], 0)); } // Write statements with bad UTF-8 (should be replaced) const char bad_str[] = { (char)0xFF, (char)0x90, 'h', 'i', 0 }; SerdNode* bad_lit = serd_new_string(bad_str); SerdNode* bad_uri = serd_new_uri(bad_str); assert(!serd_sink_write(iface, 0, s, p, bad_lit, 0)); assert(!serd_sink_write(iface, 0, s, p, bad_uri, 0)); serd_node_free(bad_uri); serd_node_free(bad_lit); // Write 1 valid statement serd_node_free(o); o = serd_new_string("hello"); assert(!serd_sink_write(iface, 0, s, p, o, 0)); serd_writer_free(writer); serd_node_free(lit); serd_node_free(o); serd_node_free(t); serd_node_free(l); serd_node_free(urn_Type); // Test buffer sink SerdBuffer buffer = { NULL, 0 }; writer = serd_writer_new( world, SERD_TURTLE, (SerdStyle)0, env, serd_buffer_sink, &buffer); o = serd_new_uri("http://example.org/base"); assert(!serd_writer_set_base_uri(writer, o)); serd_node_free(o); serd_writer_free(writer); char* out = serd_buffer_sink_finish(&buffer); assert(!strcmp(out, "@base .\n")); serd_free(out); serd_env_free(env); serd_world_free(world); fclose(fd); } static void test_reader(const char* path) { SerdWorld* world = serd_world_new(); ReaderTest rt = { 0, NULL }; SerdSink sink = { &rt, NULL, NULL, test_sink, NULL }; SerdReader* reader = serd_reader_new(world, SERD_TURTLE, &sink, 4096); assert(reader); SerdNode* g = serd_new_uri("http://example.org/"); serd_reader_set_default_graph(reader, g); serd_reader_add_blank_prefix(reader, "tmp"); serd_reader_add_blank_prefix(reader, NULL); serd_node_free(g); assert(serd_reader_start_file(reader, "http://notafile", false)); assert(serd_reader_start_file(reader, "file://invalid", false)); assert(serd_reader_start_file(reader, "file:///nonexistant", false)); assert(!serd_reader_start_file(reader, path, true)); assert(!serd_reader_read_document(reader)); assert(rt.n_statements == 13); assert(rt.graph && serd_node_string(rt.graph) && !strcmp(serd_node_string(rt.graph), "http://example.org/")); serd_reader_finish(reader); // A read of a big page hits EOF then fails to read chunks immediately { FILE* temp = tmpfile(); assert(temp); fprintf(temp, "_:s _:o .\n"); fflush(temp); fseek(temp, 0L, SEEK_SET); serd_reader_start_stream(reader, (SerdReadFunc)fread, (SerdStreamErrorFunc)ferror, temp, NULL, 4096); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); serd_reader_finish(reader); fclose(temp); } // A byte-wise reader that hits EOF once then continues (like a socket) { size_t n_reads = 0; serd_reader_start_stream(reader, (SerdReadFunc)eof_test_read, (SerdStreamErrorFunc)eof_test_error, &n_reads, NULL, 1); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); } serd_reader_free(reader); serd_world_free(world); } int main(void) { test_string_to_double(); test_double_to_node(); test_integer_to_node(); test_blob_to_node(); test_strlen(); test_strerror(); test_uri_parsing(); test_node_equals(); test_node_from_string(); test_node_from_substring(); test_simple_node(); test_literal(); test_uri_from_string(); test_relative_uri(); test_uri_resolution(); test_blank(); test_read_chunks(); test_read_string(); test_get_blank(); const char* const path = "serd_test.ttl"; test_writer(path); test_reader(path); printf("Success\n"); return 0; }