// Copyright 2011-2021 David Robillard // SPDX-License-Identifier: ISC #undef NDEBUG #include "serd/caret.h" #include "serd/env.h" #include "serd/event.h" #include "serd/input_stream.h" #include "serd/node.h" #include "serd/reader.h" #include "serd/sink.h" #include "serd/statement.h" #include "serd/status.h" #include "serd/stream.h" #include "serd/string_view.h" #include "serd/syntax.h" #include "serd/world.h" #include "zix/allocator.h" #include "zix/attributes.h" #include "zix/filesystem.h" #include "zix/path.h" #ifdef _WIN32 # include #endif #include #include #include #include typedef struct { int n_base; int n_prefix; int n_statement; int n_end; } ReaderTest; static SerdStatus test_sink(void* handle, const SerdEvent* event) { ReaderTest* rt = (ReaderTest*)handle; switch (event->type) { case SERD_BASE: ++rt->n_base; break; case SERD_PREFIX: ++rt->n_prefix; break; case SERD_STATEMENT: ++rt->n_statement; break; case SERD_END: ++rt->n_end; break; } return SERD_SUCCESS; } ZIX_PURE_FUNC static size_t prepare_test_read(void* buf, size_t size, size_t nmemb, void* stream) { assert(size == 1); assert(nmemb == 1); (void)buf; (void)size; (void)nmemb; (void)stream; return 0; } static int prepare_test_error(void* stream) { (void)stream; return 1; } static void test_prepare_error(const char* const path) { SerdWorld* const world = serd_world_new(); ReaderTest rt = {0, 0, 0, 0}; FILE* const f = fopen(path, "w+b"); assert(f); fprintf(f, "_:s _:o .\n"); fflush(f); fseek(f, 0L, SEEK_SET); SerdSink* const sink = serd_sink_new(&rt, test_sink, NULL); assert(sink); SerdEnv* const env = serd_env_new(serd_empty_string()); SerdReader* const reader = serd_reader_new(world, SERD_TURTLE, 0, env, sink); assert(reader); SerdInputStream in = serd_open_input_stream(prepare_test_read, prepare_test_error, NULL, f); assert(serd_reader_start(reader, &in, NULL, 0) == SERD_BAD_ARG); SerdStatus st = serd_reader_start(reader, &in, NULL, 1); assert(!st); assert(serd_reader_read_document(reader) == SERD_BAD_STREAM); serd_close_input(&in); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); fclose(f); assert(!zix_remove(path)); } static void test_read_string(void) { SerdWorld* world = serd_world_new(); ReaderTest rt = {0, 0, 0, 0}; SerdSink* sink = serd_sink_new(&rt, test_sink, NULL); assert(sink); SerdEnv* const env = serd_env_new(serd_empty_string()); SerdReader* const reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); assert(reader); static const char* const string1 = " " " ."; const char* position = string1; SerdInputStream in = serd_open_input_string(&position); // Test reading a string that ends exactly at the end of input (no newline) assert(!serd_reader_start(reader, &in, NULL, 1)); assert(!serd_reader_read_document(reader)); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 1); assert(rt.n_end == 0); assert(!serd_reader_finish(reader)); assert(!serd_close_input(&in)); static const char* const string2 = " " " , _:blank ."; // Test reading a chunk rt.n_statement = 0; position = string2; in = serd_open_input_string(&position); assert(!serd_reader_start(reader, &in, NULL, 1)); assert(!serd_reader_read_chunk(reader)); assert(rt.n_statement == 2); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(!serd_reader_finish(reader)); assert(!serd_close_input(&in)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); } /// Reads a null byte after a statement, then succeeds again (like a socket) static size_t eof_test_read(void* buf, size_t size, size_t nmemb, void* stream) { assert(size == 1); assert(nmemb == 1); (void)size; static const char* const string = "_:s1 _:o1 .\n" "_:s2 _:o2 .\n"; size_t* const count = (size_t*)stream; // Normal reading for the first statement if (*count < 35) { *(char*)buf = string[*count]; ++*count; return nmemb; } // EOF for the first read at the start of the second statement if (*count == 35) { assert(string[*count] == '_'); ++*count; return 0; } if (*count >= strlen(string)) { return 0; } // Normal reading after the EOF, adjusting for the skipped index 35 *(char*)buf = string[*count - 1]; ++*count; return nmemb; } static int eof_test_error(void* stream) { (void)stream; return 0; } /// A read of a big page hits EOF then fails to read chunks immediately static void test_read_eof_by_page(const char* const path) { FILE* const f = fopen(path, "w+b"); assert(f); fprintf(f, "_:s _:o .\n"); fflush(f); fseek(f, 0L, SEEK_SET); SerdWorld* world = serd_world_new(); ReaderTest ignored = {0, 0, 0, 0}; SerdSink* sink = serd_sink_new(&ignored, test_sink, NULL); SerdEnv* env = serd_env_new(serd_empty_string()); SerdReader* reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); SerdInputStream in = serd_open_input_stream((SerdReadFunc)fread, (SerdErrorFunc)ferror, NULL, f); assert(serd_reader_start(reader, &in, NULL, 4096) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(!serd_reader_finish(reader)); assert(!serd_close_input(&in)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); fclose(f); assert(!zix_remove(path)); } // A byte-wise reader hits EOF once then continues (like a socket) static void test_read_eof_by_byte(void) { SerdWorld* world = serd_world_new(); ReaderTest ignored = {0, 0, 0, 0}; SerdSink* sink = serd_sink_new(&ignored, test_sink, NULL); SerdEnv* env = serd_env_new(serd_empty_string()); SerdReader* reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); size_t n_reads = 0U; SerdInputStream in = serd_open_input_stream( (SerdReadFunc)eof_test_read, (SerdErrorFunc)eof_test_error, NULL, &n_reads); assert(serd_reader_start(reader, &in, NULL, 1) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(serd_reader_read_chunk(reader) == SERD_SUCCESS); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(!serd_reader_finish(reader)); assert(!serd_close_input(&in)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); } static void test_read_nquads_chunks(const char* const path) { static const char null = 0; FILE* const f = fopen(path, "w+b"); assert(f); // Write two statements, a null separator, then another statement fprintf(f, " " " .\n"); fprintf(f, " " " .\n"); fwrite(&null, sizeof(null), 1, f); fprintf(f, " " " .\n"); fseek(f, 0, SEEK_SET); SerdWorld* const world = serd_world_new(); ReaderTest rt = {0, 0, 0, 0}; SerdSink* const sink = serd_sink_new(&rt, test_sink, NULL); assert(sink); SerdEnv* const env = serd_env_new(serd_empty_string()); assert(env); SerdReader* const reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); assert(reader); SerdInputStream in = serd_open_input_stream((SerdReadFunc)fread, (SerdErrorFunc)ferror, NULL, f); SerdStatus st = serd_reader_start(reader, &in, NULL, 1); assert(st == SERD_SUCCESS); // Read first statement st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 1); assert(rt.n_end == 0); // Read second statement st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 2); assert(rt.n_end == 0); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 2); assert(rt.n_end == 0); // Read last statement st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 3); assert(rt.n_end == 0); // EOF st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt.n_base == 0); assert(rt.n_prefix == 0); assert(rt.n_statement == 3); assert(rt.n_end == 0); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(!serd_close_input(&in)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); fclose(f); assert(!zix_remove(path)); } static void test_read_turtle_chunks(const char* const path) { static const char null = 0; FILE* const f = fopen(path, "w+b"); assert(f); // Write two statements separated by null characters fprintf(f, "@base .\n"); fprintf(f, "@prefix eg: .\n"); fprintf(f, "eg:s eg:p1 eg:o1 ;\n"); fprintf(f, " eg:p2 eg:o2 .\n"); fwrite(&null, sizeof(null), 1, f); fprintf(f, "eg:s eg:p [ eg:sp eg:so ] .\n"); fwrite(&null, sizeof(null), 1, f); fseek(f, 0, SEEK_SET); SerdWorld* world = serd_world_new(); ReaderTest rt = {0, 0, 0, 0}; SerdSink* sink = serd_sink_new(&rt, test_sink, NULL); assert(sink); SerdEnv* const env = serd_env_new(serd_empty_string()); assert(env); SerdReader* const reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); assert(reader); SerdInputStream in = serd_open_input_stream((SerdReadFunc)fread, (SerdErrorFunc)ferror, NULL, f); SerdStatus st = serd_reader_start(reader, &in, NULL, 1); assert(st == SERD_SUCCESS); // Read base st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 1); assert(rt.n_prefix == 0); assert(rt.n_statement == 0); assert(rt.n_end == 0); // Read prefix st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 0); assert(rt.n_end == 0); // Read first two statements st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 2); assert(rt.n_end == 0); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 2); assert(rt.n_end == 0); // Read statements after null terminator st = serd_reader_read_chunk(reader); assert(st == SERD_SUCCESS); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 4); assert(rt.n_end == 1); // Read terminator st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 4); assert(rt.n_end == 1); // EOF st = serd_reader_read_chunk(reader); assert(st == SERD_FAILURE); assert(rt.n_base == 1); assert(rt.n_prefix == 1); assert(rt.n_statement == 4); assert(rt.n_end == 1); assert(serd_reader_read_chunk(reader) == SERD_FAILURE); assert(!serd_close_input(&in)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); fclose(f); assert(!zix_remove(path)); } /// Test that reading SERD_SYNTAX_EMPTY "succeeds" without reading any input static void test_read_empty(const char* const path) { SerdWorld* const world = serd_world_new(); ReaderTest rt = {0, 0, 0, 0}; SerdSink* const sink = serd_sink_new(&rt, test_sink, NULL); assert(sink); SerdEnv* const env = serd_env_new(serd_empty_string()); assert(env); SerdReader* const reader = serd_reader_new(world, SERD_SYNTAX_EMPTY, 0U, env, sink); assert(reader); FILE* const f = fopen(path, "w+b"); assert(f); SerdInputStream in = serd_open_input_stream((SerdReadFunc)fread, (SerdErrorFunc)ferror, NULL, f); SerdStatus st = serd_reader_start(reader, &in, NULL, 1); assert(!st); assert(serd_reader_read_document(reader) == SERD_SUCCESS); assert(rt.n_statement == 0); assert(!serd_reader_finish(reader)); assert(!serd_close_input(&in)); fclose(f); assert(!zix_remove(path)); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); } static SerdStatus check_cursor(void* handle, const SerdEvent* event) { bool* const called = (bool*)handle; if (event->type == SERD_STATEMENT) { const SerdCaret* const caret = serd_statement_caret(event->statement.statement); assert(caret); assert(!strcmp(serd_node_string(serd_caret_document(caret)), "string")); assert(serd_caret_line(caret) == 1); assert(serd_caret_column(caret) == 47); } *called = true; return SERD_SUCCESS; } static void test_error_cursor(void) { SerdWorld* world = serd_world_new(); bool called = false; SerdSink* sink = serd_sink_new(&called, check_cursor, NULL); SerdEnv* const env = serd_env_new(serd_empty_string()); SerdReader* const reader = serd_reader_new(world, SERD_TURTLE, 0U, env, sink); assert(sink); assert(reader); static const char* const string = " " " ."; SerdNode* const string_name = serd_new_string(serd_string("string")); const char* position = string; SerdInputStream in = serd_open_input_string(&position); SerdStatus st = serd_reader_start(reader, &in, string_name, 1); assert(!st); assert(serd_reader_read_document(reader) == SERD_SUCCESS); assert(!serd_reader_finish(reader)); assert(called); assert(!serd_close_input(&in)); serd_node_free(string_name); serd_reader_free(reader); serd_env_free(env); serd_sink_free(sink); serd_world_free(world); } int main(void) { char* const temp = zix_temp_directory_path(NULL); char* const path_pattern = zix_path_join(NULL, temp, "serdXXXXXX"); char* const dir = zix_create_temporary_directory(NULL, path_pattern); char* const ttl_path = zix_path_join(NULL, dir, "serd_test_reader.ttl"); char* const nq_path = zix_path_join(NULL, dir, "serd_test_reader.nq"); test_read_nquads_chunks(nq_path); test_read_turtle_chunks(ttl_path); test_prepare_error(ttl_path); test_read_string(); test_read_eof_by_page(ttl_path); test_read_eof_by_byte(); test_read_nquads_chunks(nq_path); test_read_turtle_chunks(ttl_path); test_read_empty(ttl_path); test_error_cursor(); assert(!zix_remove(dir)); zix_free(NULL, nq_path); zix_free(NULL, ttl_path); zix_free(NULL, dir); zix_free(NULL, path_pattern); zix_free(NULL, temp); return 0; }