/* Copyright 2011-2021 David Robillard <d@drobilla.net> Permission to use, copy, modify, and/or distribute this software for any purpose with or without fee is hereby granted, provided that the above copyright notice and this permission notice appear in all copies. THIS SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ #include "console.h" #include "serd/serd.h" #ifdef _WIN32 # ifdef _MSC_VER # define WIN32_LEAN_AND_MEAN 1 # endif # include <fcntl.h> # include <io.h> #endif #include <errno.h> #include <limits.h> #include <stdint.h> #include <stdlib.h> #include <string.h> SerdStatus serd_tool_setup(SerdTool* const tool, const char* const program, SerdCommonOptions options) { // Open the output first, since if that fails we have nothing to do const char* const out_path = options.out_filename; if (!(tool->out = serd_open_output(out_path, options.block_size))) { fprintf(stderr, "%s: failed to open output file (%s)\n", program, strerror(errno)); return SERD_ERR_UNKNOWN; } // We have something to write to, so build the writing environment if (!(tool->world = serd_world_new()) || !(tool->env = serd_create_env(program, options.base_uri, options.out_filename)) || !(tool->writer = serd_writer_new( tool->world, serd_choose_syntax( tool->world, options.output, options.out_filename, SERD_NQUADS), options.output.flags, tool->env, tool->out))) { fprintf(stderr, "%s: failed to set up writing environment\n", program); return SERD_ERR_INTERNAL; } return SERD_SUCCESS; } SerdStatus serd_tool_cleanup(const SerdTool tool) { SerdStatus st = SERD_SUCCESS; if (tool.out) { // Close the output stream explicitly to check if there were any errors if (serd_byte_sink_close(tool.out)) { perror("write error"); st = SERD_ERR_BAD_WRITE; } } serd_writer_free(tool.writer); serd_env_free(tool.env); serd_world_free(tool.world); serd_byte_sink_free(tool.out); return st; } void serd_set_stream_utf8_mode(FILE* const stream) { #ifdef _WIN32 _setmode(_fileno(stream), _O_BINARY); #else (void)stream; #endif } SerdStatus serd_print_version(const char* const program) { printf("%s %d.%d.%d <http://drobilla.net/software/serd>\n", program, SERD_MAJOR_VERSION, SERD_MINOR_VERSION, SERD_MICRO_VERSION); printf("Copyright 2011-2022 David Robillard <d@drobilla.net>.\n" "License: <http://www.opensource.org/licenses/isc>\n" "This is free software; you are free to change and redistribute it.\n" "There is NO WARRANTY, to the extent permitted by law.\n"); return SERD_FAILURE; } SerdStatus serd_get_argument(OptionIter* const iter, const char** const argument) { const char flag = iter->argv[iter->a][iter->f++]; if (iter->argv[iter->a][iter->f] || (iter->a + 1) == iter->argc) { fprintf( stderr, "%s: option requires an argument -- %c\n", iter->argv[0], flag); return SERD_ERR_BAD_ARG; } *argument = iter->argv[++iter->a]; ++iter->a; iter->f = 1; return SERD_SUCCESS; } SerdStatus serd_get_size_argument(OptionIter* const iter, size_t* const argument) { SerdStatus st = SERD_SUCCESS; const char* string = NULL; if ((st = serd_get_argument(iter, &string))) { return st; } char* endptr = NULL; const long size = strtol(string, &endptr, 10); if (size <= 0 || size == LONG_MAX || *endptr != '\0') { return SERD_ERR_BAD_ARG; } *argument = (size_t)size; return SERD_SUCCESS; } SerdStatus serd_set_input_option(const SerdStringView name, SerdSyntax* const syntax, SerdReaderFlags* const flags) { typedef struct { const char* name; SerdReaderFlag flag; } InputOption; static const InputOption input_options[] = { {"lax", SERD_READ_LAX}, {"variables", SERD_READ_VARIABLES}, {"relative", SERD_READ_RELATIVE}, {"global", SERD_READ_GLOBAL}, {"generated", SERD_READ_GENERATED}, {NULL, SERD_READ_LAX}, }; const SerdSyntax named_syntax = serd_syntax_by_name(name.buf); if (!serd_strncasecmp(name.buf, "empty", name.len) || named_syntax != SERD_SYNTAX_EMPTY) { *syntax = named_syntax; return SERD_SUCCESS; } for (const InputOption* o = input_options; o->name; ++o) { if (!serd_strncasecmp(o->name, name.buf, name.len)) { *flags |= o->flag; return SERD_SUCCESS; } } return SERD_ERR_BAD_ARG; } SerdStatus serd_parse_input_argument(OptionIter* const iter, SerdSyntaxOptions* const options) { SerdStatus st = SERD_SUCCESS; const char* argument = NULL; if (!(st = serd_get_argument(iter, &argument))) { if ((st = serd_set_input_option( SERD_STRING(argument), &options->syntax, &options->flags))) { fprintf(stderr, "%s: unknown option \"%s\"\n", iter->argv[0], argument); } else if (!strcmp(argument, "empty") || options->syntax) { options->overridden = true; } } return st; } SerdStatus serd_set_output_option(const SerdStringView name, SerdSyntax* const syntax, SerdWriterFlags* const flags) { typedef struct { const char* name; SerdWriterFlag flag; } OutputOption; static const OutputOption output_options[] = { {"ascii", SERD_WRITE_ASCII}, {"expanded", SERD_WRITE_EXPANDED}, {"verbatim", SERD_WRITE_VERBATIM}, {"terse", SERD_WRITE_TERSE}, {"lax", SERD_WRITE_LAX}, {"rdf_type", SERD_WRITE_RDF_TYPE}, {NULL, SERD_WRITE_ASCII}, }; const SerdSyntax named_syntax = serd_syntax_by_name(name.buf); if (!serd_strncasecmp(name.buf, "empty", name.len) || named_syntax != SERD_SYNTAX_EMPTY) { *syntax = named_syntax; return SERD_SUCCESS; } for (const OutputOption* o = output_options; o->name; ++o) { if (!serd_strncasecmp(o->name, name.buf, name.len)) { *flags |= o->flag; return SERD_SUCCESS; } } return SERD_ERR_BAD_ARG; } SerdStatus serd_parse_output_argument(OptionIter* const iter, SerdSyntaxOptions* const options) { SerdStatus st = SERD_SUCCESS; const char* argument = NULL; if (!(st = serd_get_argument(iter, &argument))) { if ((st = serd_set_output_option( SERD_STRING(argument), &options->syntax, &options->flags))) { fprintf(stderr, "%s: unknown option \"%s\"\n", iter->argv[0], argument); } else if (!strcmp(argument, "empty") || options->syntax) { options->overridden = true; } } return st; } SerdStatus serd_parse_common_option(OptionIter* const iter, SerdCommonOptions* const opts) { const char opt = iter->argv[iter->a][iter->f]; switch (opt) { case 'B': return serd_get_argument(iter, &opts->base_uri); case 'I': return serd_parse_input_argument(iter, &opts->input); case 'O': return serd_parse_output_argument(iter, &opts->output); case 'b': return serd_get_size_argument(iter, &opts->block_size); case 'k': return serd_get_size_argument(iter, &opts->stack_size); case 'o': return serd_get_argument(iter, &opts->out_filename); default: break; } return SERD_FAILURE; } SerdEnv* serd_create_env(const char* const program, const char* const base_string, const char* const out_filename) { const bool is_rebase = base_string && !strcmp(base_string, "rebase"); if (is_rebase && !out_filename) { fprintf(stderr, "%s: rebase requires an output filename\n", program); return NULL; } if (base_string && serd_uri_string_has_scheme(base_string)) { return serd_env_new(SERD_STRING(base_string)); } SerdEnv* const env = serd_env_new(SERD_EMPTY_STRING()); serd_set_base_uri_from_path(env, is_rebase ? out_filename : base_string); return env; } SerdSyntax serd_choose_syntax(SerdWorld* const world, const SerdSyntaxOptions options, const char* const filename, const SerdSyntax fallback) { if (options.overridden || options.syntax != SERD_SYNTAX_EMPTY) { return options.syntax; } if (!filename || !strcmp(filename, "-")) { return fallback; } const SerdSyntax guessed = serd_guess_syntax(filename); if (guessed != SERD_SYNTAX_EMPTY) { return guessed; } serd_logf(world, SERD_LOG_LEVEL_WARNING, "unable to determine syntax of \"%s\", trying TriG", filename); return SERD_TRIG; } /// Wrapper for getc that is compatible with SerdReadFunc but faster than fread static size_t serd_file_read_byte(void* buf, size_t size, size_t nmemb, void* stream) { (void)size; (void)nmemb; const int c = getc((FILE*)stream); if (c == EOF) { *((uint8_t*)buf) = 0; return 0; } *((uint8_t*)buf) = (uint8_t)c; return 1; } SerdByteSource* serd_open_input(const char* const filename, const size_t block_size) { SerdByteSource* byte_source = NULL; if (!strcmp(filename, "-")) { serd_set_stream_utf8_mode(stdin); SerdNode* name = serd_new_string(SERD_STRING("stdin")); byte_source = serd_byte_source_new_function( serd_file_read_byte, (SerdStreamErrorFunc)ferror, NULL, stdin, name, 1); serd_node_free(name); } else { byte_source = serd_byte_source_new_filename(filename, block_size); } return byte_source; } SerdByteSink* serd_open_output(const char* const filename, const size_t block_size) { if (!filename || !strcmp(filename, "-")) { serd_set_stream_utf8_mode(stdout); return serd_byte_sink_new_function( (SerdWriteFunc)fwrite, (SerdStreamCloseFunc)fclose, stdout, 1); } return serd_byte_sink_new_filename(filename, block_size); } SerdStatus serd_set_base_uri_from_path(SerdEnv* const env, const char* const path) { const size_t path_len = path ? strlen(path) : 0u; if (!path_len) { return SERD_ERR_BAD_ARG; } char* const real_path = serd_canonical_path(path); if (!real_path) { return SERD_ERR_BAD_ARG; } const size_t real_path_len = strlen(real_path); SerdNode* base_node = NULL; if (path[path_len - 1] == '/' || path[path_len - 1] == '\\') { char* const base_path = (char*)calloc(real_path_len + 2, 1); memcpy(base_path, real_path, real_path_len); base_path[real_path_len] = path[path_len - 1]; base_node = serd_new_file_uri(SERD_STRING(base_path), SERD_EMPTY_STRING()); free(base_path); } else { base_node = serd_new_file_uri(SERD_STRING(real_path), SERD_EMPTY_STRING()); } serd_env_set_base_uri(env, serd_node_string_view(base_node)); serd_node_free(base_node); serd_free(real_path); return SERD_SUCCESS; } SerdStatus serd_read_source(SerdWorld* const world, const SerdCommonOptions opts, SerdEnv* const env, const SerdSyntax syntax, SerdByteSource* const in, const SerdSink* const sink) { SerdReader* const reader = serd_reader_new( world, syntax, opts.input.flags, env, sink, opts.stack_size); SerdStatus st = serd_reader_start(reader, in); if (!st) { st = serd_reader_read_document(reader); } serd_reader_free(reader); return st; } SerdStatus serd_read_inputs(SerdWorld* const world, const SerdCommonOptions opts, SerdEnv* const env, const intptr_t n_inputs, char* const* const inputs, const SerdSink* const sink) { SerdStatus st = SERD_SUCCESS; for (intptr_t i = 0; !st && i < n_inputs; ++i) { // Use the filename as the base URI if possible if user didn't override it const char* const in_path = inputs[i]; if (!opts.base_uri[0] && strcmp(in_path, "-")) { serd_set_base_uri_from_path(env, in_path); } // Open the input stream SerdByteSource* const in = serd_open_input(in_path, opts.block_size); if (!in) { return SERD_ERR_BAD_ARG; } // Read the entire file st = serd_read_source( world, opts, env, serd_choose_syntax(world, opts.input, in_path, SERD_TRIG), in, sink); serd_byte_source_free(in); } return st; }