cannam@115: /* cannam@115: Copyright 2011-2013 David Robillard cannam@115: cannam@115: Permission to use, copy, modify, and/or distribute this software for any cannam@115: purpose with or without fee is hereby granted, provided that the above cannam@115: copyright notice and this permission notice appear in all copies. cannam@115: cannam@115: THIS SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES cannam@115: WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF cannam@115: MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR cannam@115: ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES cannam@115: WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN cannam@115: ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF cannam@115: OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. cannam@115: */ cannam@115: cannam@115: /** cannam@115: @file sord.h API for Sord, a lightweight RDF model library. cannam@115: */ cannam@115: cannam@115: #ifndef SORD_SORD_H cannam@115: #define SORD_SORD_H cannam@115: cannam@115: #include cannam@115: #include cannam@115: #include cannam@115: cannam@115: #include "serd/serd.h" cannam@115: cannam@115: #ifdef SORD_SHARED cannam@115: # ifdef _WIN32 cannam@115: # define SORD_LIB_IMPORT __declspec(dllimport) cannam@115: # define SORD_LIB_EXPORT __declspec(dllexport) cannam@115: # else cannam@115: # define SORD_LIB_IMPORT __attribute__((visibility("default"))) cannam@115: # define SORD_LIB_EXPORT __attribute__((visibility("default"))) cannam@115: # endif cannam@115: # ifdef SORD_INTERNAL cannam@115: # define SORD_API SORD_LIB_EXPORT cannam@115: # else cannam@115: # define SORD_API SORD_LIB_IMPORT cannam@115: # endif cannam@115: #else cannam@115: # define SORD_API cannam@115: #endif cannam@115: cannam@115: #ifdef __cplusplus cannam@115: extern "C" { cannam@115: #else cannam@115: # include cannam@115: #endif cannam@115: cannam@115: /** cannam@115: @defgroup sord Sord cannam@115: A lightweight RDF model library. cannam@115: cannam@115: Sord stores RDF (subject object predicate context) quads, where the context cannam@115: may be omitted (to represent triples in the default graph). cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Sord World. cannam@115: The World represents all library state, including interned strings. cannam@115: */ cannam@115: typedef struct SordWorldImpl SordWorld; cannam@115: cannam@115: /** cannam@115: Sord Model. cannam@115: cannam@115: A model is an indexed set of Quads (i.e. it can contain several RDF cannam@115: graphs). It may be searched using various patterns depending on which cannam@115: indices are enabled. cannam@115: */ cannam@115: typedef struct SordModelImpl SordModel; cannam@115: cannam@115: /** cannam@115: Model Inserter. cannam@115: cannam@115: An inserter is used for writing statements to a model using the Serd sink cannam@115: interface. This makes it simple to write to a model directly using a cannam@115: SerdReader, or any other code that writes statements to a SerdStatementSink. cannam@115: */ cannam@115: typedef struct SordInserterImpl SordInserter; cannam@115: cannam@115: /** cannam@115: Model Iterator. cannam@115: */ cannam@115: typedef struct SordIterImpl SordIter; cannam@115: cannam@115: /** cannam@115: RDF Node. cannam@115: A Node is a component of a Quad. Nodes may be URIs, blank nodes, or cannam@115: (in the case of quad objects only) string literals. Literal nodes may cannam@115: have an associate language or datatype (but not both). cannam@115: */ cannam@115: typedef struct SordNodeImpl SordNode; cannam@115: cannam@115: /** cannam@115: Quad of nodes (a statement), or a quad pattern. cannam@115: cannam@115: Nodes are ordered (S P O G). The ID of the default graph is 0. cannam@115: */ cannam@115: typedef const SordNode* SordQuad[4]; cannam@115: cannam@115: /** cannam@115: Index into a SordQuad. cannam@115: */ cannam@115: typedef enum { cannam@115: SORD_SUBJECT = 0, /**< Subject */ cannam@115: SORD_PREDICATE = 1, /**< Predicate (a.k.a. "key") */ cannam@115: SORD_OBJECT = 2, /**< Object (a.k.a. "value") */ cannam@115: SORD_GRAPH = 3 /**< Graph (a.k.a. "context") */ cannam@115: } SordQuadIndex; cannam@115: cannam@115: /** cannam@115: Type of a node. cannam@115: */ cannam@115: typedef enum { cannam@115: SORD_URI = 1, /**< URI */ cannam@115: SORD_BLANK = 2, /**< Blank node identifier */ cannam@115: SORD_LITERAL = 3 /**< Literal (string with optional lang or datatype) */ cannam@115: } SordNodeType; cannam@115: cannam@115: /** cannam@115: Indexing option. cannam@115: */ cannam@115: typedef enum { cannam@115: SORD_SPO = 1, /**< Subject, Predicate, Object */ cannam@115: SORD_SOP = 1 << 1, /**< Subject, Object, Predicate */ cannam@115: SORD_OPS = 1 << 2, /**< Object, Predicate, Subject */ cannam@115: SORD_OSP = 1 << 3, /**< Object, Subject, Predicate */ cannam@115: SORD_PSO = 1 << 4, /**< Predicate, Subject, Object */ cannam@115: SORD_POS = 1 << 5 /**< Predicate, Object, Subject */ cannam@115: } SordIndexOption; cannam@115: cannam@115: /** cannam@115: @name World cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Create a new Sord World. cannam@115: It is safe to use multiple worlds in one process, though no data cannam@115: (e.g. nodes) can be shared between worlds, and this should be avoided if cannam@115: possible for performance reasons. cannam@115: */ cannam@115: SORD_API cannam@115: SordWorld* cannam@115: sord_world_new(void); cannam@115: cannam@115: /** cannam@115: Free @c world. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_world_free(SordWorld* world); cannam@115: cannam@115: /** cannam@115: Set a function to be called when errors occur. cannam@115: cannam@115: The @p error_sink will be called with @p handle as its first argument. If cannam@115: no error function is set, errors are printed to stderr. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_world_set_error_sink(SordWorld* world, cannam@115: SerdErrorSink error_sink, cannam@115: void* handle); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Node cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Get a URI node from a string. cannam@115: cannam@115: Note this function measures @c str, which is a common bottleneck. cannam@115: Use sord_node_from_serd_node instead if @c str is already measured. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_new_uri(SordWorld* world, const uint8_t* uri); cannam@115: cannam@115: /** cannam@115: Get a URI node from a relative URI string. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_new_relative_uri(SordWorld* world, cannam@115: const uint8_t* str, cannam@115: const uint8_t* base_uri); cannam@115: cannam@115: /** cannam@115: Get a blank node from a string. cannam@115: cannam@115: Note this function measures @c str, which is a common bottleneck. cannam@115: Use sord_node_from_serd_node instead if @c str is already measured. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_new_blank(SordWorld* world, const uint8_t* str); cannam@115: cannam@115: /** cannam@115: Get a literal node from a string. cannam@115: cannam@115: Note this function measures @c str, which is a common bottleneck. cannam@115: Use sord_node_from_serd_node instead if @c str is already measured. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_new_literal(SordWorld* world, cannam@115: SordNode* datatype, cannam@115: const uint8_t* str, cannam@115: const char* lang); cannam@115: cannam@115: /** cannam@115: Copy a node (obtain a reference). cannam@115: cannam@115: Node that since nodes are interned and reference counted, this does not cannam@115: actually create a deep copy of @c node. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_node_copy(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Free a node (drop a reference). cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_node_free(SordWorld* world, SordNode* node); cannam@115: cannam@115: /** cannam@115: Return the type of a node (SORD_URI, SORD_BLANK, or SORD_LITERAL). cannam@115: */ cannam@115: SORD_API cannam@115: SordNodeType cannam@115: sord_node_get_type(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return the string value of a node. cannam@115: */ cannam@115: SORD_API cannam@115: const uint8_t* cannam@115: sord_node_get_string(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return the string value of a node, and set @c len to its length. cannam@115: */ cannam@115: SORD_API cannam@115: const uint8_t* cannam@115: sord_node_get_string_counted(const SordNode* node, size_t* len); cannam@115: cannam@115: /** cannam@115: Return the language of a literal node (or NULL). cannam@115: */ cannam@115: SORD_API cannam@115: const char* cannam@115: sord_node_get_language(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return the datatype URI of a literal node (or NULL). cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_node_get_datatype(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return the flags (string attributes) of a node. cannam@115: */ cannam@115: SORD_API cannam@115: SerdNodeFlags cannam@115: sord_node_get_flags(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return true iff node can be serialised as an inline object. cannam@115: cannam@115: More specifically, this returns true iff the node is the object field cannam@115: of exactly one statement, and therefore can be inlined since it needn't cannam@115: be referred to by name. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_node_is_inline_object(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Return true iff @c a is equal to @c b. cannam@115: cannam@115: Note this is much faster than comparing the node's strings. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_node_equals(const SordNode* a, cannam@115: const SordNode* b); cannam@115: cannam@115: /** cannam@115: Return a SordNode as a SerdNode. cannam@115: cannam@115: The returned node is shared and must not be freed or modified. cannam@115: */ cannam@115: SORD_API cannam@115: const SerdNode* cannam@115: sord_node_to_serd_node(const SordNode* node); cannam@115: cannam@115: /** cannam@115: Create a new SordNode from a SerdNode. cannam@115: cannam@115: The returned node must be freed using sord_node_free. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_node_from_serd_node(SordWorld* world, cannam@115: SerdEnv* env, cannam@115: const SerdNode* node, cannam@115: const SerdNode* datatype, cannam@115: const SerdNode* lang); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Model cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Create a new model. cannam@115: cannam@115: @param world The world in which to make this model. cannam@115: cannam@115: @param indices SordIndexOption flags (e.g. SORD_SPO|SORD_OPS). Be sure to cannam@115: enable an index where the most significant node(s) are not variables in your cannam@115: queries (e.g. to make (? P O) queries, enable either SORD_OPS or SORD_POS). cannam@115: cannam@115: @param graphs If true, store (and index) graph contexts. cannam@115: */ cannam@115: SORD_API cannam@115: SordModel* cannam@115: sord_new(SordWorld* world, cannam@115: unsigned indices, cannam@115: bool graphs); cannam@115: cannam@115: /** cannam@115: Close and free @c model. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_free(SordModel* model); cannam@115: cannam@115: /** cannam@115: Get the world associated with @c model. cannam@115: */ cannam@115: SORD_API cannam@115: SordWorld* cannam@115: sord_get_world(SordModel* model); cannam@115: cannam@115: /** cannam@115: Return the number of nodes stored in @c world. cannam@115: cannam@115: Nodes are included in this count iff they are a part of a quad in @c world. cannam@115: */ cannam@115: SORD_API cannam@115: size_t cannam@115: sord_num_nodes(const SordWorld* world); cannam@115: cannam@115: /** cannam@115: Return the number of quads stored in @c model. cannam@115: */ cannam@115: SORD_API cannam@115: size_t cannam@115: sord_num_quads(const SordModel* model); cannam@115: cannam@115: /** cannam@115: Return an iterator to the start of @c model. cannam@115: */ cannam@115: SORD_API cannam@115: SordIter* cannam@115: sord_begin(const SordModel* model); cannam@115: cannam@115: /** cannam@115: Search for statements by a quad pattern. cannam@115: @return an iterator to the first match, or NULL if no matches found. cannam@115: */ cannam@115: SORD_API cannam@115: SordIter* cannam@115: sord_find(SordModel* model, const SordQuad pat); cannam@115: cannam@115: /** cannam@115: Search for statements by nodes. cannam@115: @return an iterator to the first match, or NULL if no matches found. cannam@115: */ cannam@115: SORD_API cannam@115: SordIter* cannam@115: sord_search(SordModel* model, cannam@115: const SordNode* s, cannam@115: const SordNode* p, cannam@115: const SordNode* o, cannam@115: const SordNode* g); cannam@115: /** cannam@115: Search for a single node that matches a pattern. cannam@115: Exactly one of @p s, @p p, @p o must be NULL. cannam@115: This function is mainly useful for predicates that only have one value. cannam@115: The returned node must be freed using sord_node_free. cannam@115: @return the first matching node, or NULL if no matches are found. cannam@115: */ cannam@115: SORD_API cannam@115: SordNode* cannam@115: sord_get(SordModel* model, cannam@115: const SordNode* s, cannam@115: const SordNode* p, cannam@115: const SordNode* o, cannam@115: const SordNode* g); cannam@115: cannam@115: /** cannam@115: Return true iff a statement exists. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_ask(SordModel* model, cannam@115: const SordNode* s, cannam@115: const SordNode* p, cannam@115: const SordNode* o, cannam@115: const SordNode* g); cannam@115: cannam@115: /** cannam@115: Return the number of matching statements. cannam@115: */ cannam@115: SORD_API cannam@115: uint64_t cannam@115: sord_count(SordModel* model, cannam@115: const SordNode* s, cannam@115: const SordNode* p, cannam@115: const SordNode* o, cannam@115: const SordNode* g); cannam@115: cannam@115: /** cannam@115: Check if @a model contains a triple pattern. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_contains(SordModel* model, const SordQuad pat); cannam@115: cannam@115: /** cannam@115: Add a quad to a model. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_add(SordModel* model, const SordQuad quad); cannam@115: cannam@115: /** cannam@115: Remove a quad from a model. cannam@115: cannam@115: Note that is it illegal to remove while iterating over @c model. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_remove(SordModel* model, const SordQuad quad); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Inserter cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Create an inserter for writing statements to a model. cannam@115: */ cannam@115: SORD_API cannam@115: SordInserter* cannam@115: sord_inserter_new(SordModel* model, cannam@115: SerdEnv* env); cannam@115: cannam@115: /** cannam@115: Free an inserter. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_inserter_free(SordInserter* inserter); cannam@115: cannam@115: /** cannam@115: Set the current base URI for writing to the model. cannam@115: cannam@115: Note this function can be safely casted to SerdBaseSink. cannam@115: */ cannam@115: SORD_API cannam@115: SerdStatus cannam@115: sord_inserter_set_base_uri(SordInserter* inserter, cannam@115: const SerdNode* uri); cannam@115: cannam@115: /** cannam@115: Set a namespace prefix for writing to the model. cannam@115: cannam@115: Note this function can be safely casted to SerdPrefixSink. cannam@115: */ cannam@115: SORD_API cannam@115: SerdStatus cannam@115: sord_inserter_set_prefix(SordInserter* inserter, cannam@115: const SerdNode* name, cannam@115: const SerdNode* uri); cannam@115: cannam@115: /** cannam@115: Write a statement to the model. cannam@115: cannam@115: Note this function can be safely casted to SerdStatementSink. cannam@115: */ cannam@115: SORD_API cannam@115: SerdStatus cannam@115: sord_inserter_write_statement(SordInserter* inserter, cannam@115: SerdStatementFlags flags, cannam@115: const SerdNode* graph, cannam@115: const SerdNode* subject, cannam@115: const SerdNode* predicate, cannam@115: const SerdNode* object, cannam@115: const SerdNode* object_datatype, cannam@115: const SerdNode* object_lang); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Iteration cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Set @c quad to the quad pointed to by @c iter. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_iter_get(const SordIter* iter, SordQuad quad); cannam@115: cannam@115: /** cannam@115: Return a field of the quad pointed to by @c iter. cannam@115: */ cannam@115: SORD_API cannam@115: const SordNode* cannam@115: sord_iter_get_node(const SordIter* iter, SordQuadIndex index); cannam@115: cannam@115: /** cannam@115: Return the store pointed to by @c iter. cannam@115: */ cannam@115: SORD_API cannam@115: const SordModel* cannam@115: sord_iter_get_model(SordIter* iter); cannam@115: cannam@115: /** cannam@115: Increment @c iter to point to the next statement. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_iter_next(SordIter* iter); cannam@115: cannam@115: /** cannam@115: Return true iff @c iter is at the end of its range. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_iter_end(const SordIter* iter); cannam@115: cannam@115: /** cannam@115: Free @c iter. cannam@115: */ cannam@115: SORD_API cannam@115: void cannam@115: sord_iter_free(SordIter* iter); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Utilities cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Match two quads (using ID comparison only). cannam@115: cannam@115: This function is a straightforward and fast equivalence match with wildcard cannam@115: support (ID 0 is a wildcard). It does not actually read node data. cannam@115: @return true iff @c x and @c y match. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_quad_match(const SordQuad x, const SordQuad y); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @name Serialisation cannam@115: @{ cannam@115: */ cannam@115: cannam@115: /** cannam@115: Return a reader that will read into @c model. cannam@115: */ cannam@115: SORD_API cannam@115: SerdReader* cannam@115: sord_new_reader(SordModel* model, cannam@115: SerdEnv* env, cannam@115: SerdSyntax syntax, cannam@115: SordNode* graph); cannam@115: cannam@115: /** cannam@115: Write a model to a writer. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_write(SordModel* model, cannam@115: SerdWriter* writer, cannam@115: SordNode* graph); cannam@115: cannam@115: /** cannam@115: Write a range to a writer. cannam@115: cannam@115: This increments @c iter to its end, then frees it. cannam@115: */ cannam@115: SORD_API cannam@115: bool cannam@115: sord_write_iter(SordIter* iter, cannam@115: SerdWriter* writer); cannam@115: cannam@115: /** cannam@115: @} cannam@115: @} cannam@115: */ cannam@115: cannam@115: #ifdef __cplusplus cannam@115: } /* extern "C" */ cannam@115: #endif cannam@115: cannam@115: #endif /* SORD_SORD_H */