cannam@226: /* cannam@226: Copyright 2011-2016 David Robillard cannam@226: cannam@226: Permission to use, copy, modify, and/or distribute this software for any cannam@226: purpose with or without fee is hereby granted, provided that the above cannam@226: copyright notice and this permission notice appear in all copies. cannam@226: cannam@226: THIS SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES cannam@226: WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF cannam@226: MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR cannam@226: ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES cannam@226: WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN cannam@226: ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF cannam@226: OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. cannam@226: */ cannam@226: cannam@226: #include "serd_internal.h" cannam@226: cannam@226: #include cannam@226: #include cannam@226: cannam@226: #include cannam@226: #include cannam@226: cannam@226: #ifdef _WIN32 cannam@226: # ifndef isnan cannam@226: # define isnan(x) _isnan(x) cannam@226: # endif cannam@226: # ifndef isinf cannam@226: # define isinf(x) (!_finite(x)) cannam@226: # endif cannam@226: #endif cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_from_string(SerdType type, const uint8_t* buf) cannam@226: { cannam@226: if (!buf) { cannam@226: return SERD_NODE_NULL; cannam@226: } cannam@226: cannam@226: uint32_t flags = 0; cannam@226: size_t buf_n_bytes = 0; cannam@226: const size_t buf_n_chars = serd_strlen(buf, &buf_n_bytes, &flags); cannam@226: SerdNode ret = { buf, buf_n_bytes, buf_n_chars, flags, type }; cannam@226: return ret; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_copy(const SerdNode* node) cannam@226: { cannam@226: if (!node || !node->buf) { cannam@226: return SERD_NODE_NULL; cannam@226: } cannam@226: cannam@226: SerdNode copy = *node; cannam@226: uint8_t* buf = (uint8_t*)malloc(copy.n_bytes + 1); cannam@226: memcpy(buf, node->buf, copy.n_bytes + 1); cannam@226: copy.buf = buf; cannam@226: return copy; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: bool cannam@226: serd_node_equals(const SerdNode* a, const SerdNode* b) cannam@226: { cannam@226: return (a == b) cannam@226: || (a->type == b->type cannam@226: && a->n_bytes == b->n_bytes cannam@226: && a->n_chars == b->n_chars cannam@226: && ((a->buf == b->buf) || !memcmp((const char*)a->buf, cannam@226: (const char*)b->buf, cannam@226: a->n_bytes + 1))); cannam@226: } cannam@226: cannam@226: static size_t cannam@226: serd_uri_string_length(const SerdURI* uri) cannam@226: { cannam@226: size_t len = uri->path_base.len; cannam@226: cannam@226: #define ADD_LEN(field, n_delims) \ cannam@226: if ((field).len) { len += (field).len + (n_delims); } cannam@226: cannam@226: ADD_LEN(uri->path, 1); // + possible leading `/' cannam@226: ADD_LEN(uri->scheme, 1); // + trailing `:' cannam@226: ADD_LEN(uri->authority, 2); // + leading `//' cannam@226: ADD_LEN(uri->query, 1); // + leading `?' cannam@226: ADD_LEN(uri->fragment, 1); // + leading `#' cannam@226: cannam@226: return len + 2; // + 2 for authority `//' cannam@226: } cannam@226: cannam@226: static size_t cannam@226: string_sink(const void* buf, size_t len, void* stream) cannam@226: { cannam@226: uint8_t** ptr = (uint8_t**)stream; cannam@226: memcpy(*ptr, buf, len); cannam@226: *ptr += len; cannam@226: return len; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_uri_from_node(const SerdNode* uri_node, cannam@226: const SerdURI* base, cannam@226: SerdURI* out) cannam@226: { cannam@226: return (uri_node->type == SERD_URI && uri_node->buf) cannam@226: ? serd_node_new_uri_from_string(uri_node->buf, base, out) cannam@226: : SERD_NODE_NULL; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_uri_from_string(const uint8_t* str, cannam@226: const SerdURI* base, cannam@226: SerdURI* out) cannam@226: { cannam@226: if (!str || str[0] == '\0') { cannam@226: // Empty URI => Base URI, or nothing if no base is given cannam@226: return base ? serd_node_new_uri(base, NULL, out) : SERD_NODE_NULL; cannam@226: } cannam@226: cannam@226: SerdURI uri; cannam@226: serd_uri_parse(str, &uri); cannam@226: return serd_node_new_uri(&uri, base, out); // Resolve/Serialise cannam@226: } cannam@226: cannam@226: static inline bool cannam@226: is_uri_path_char(const uint8_t c) cannam@226: { cannam@226: if (is_alpha(c) || is_digit(c)) { cannam@226: return true; cannam@226: } cannam@226: switch (c) { cannam@226: case '-': case '.': case '_': case '~': // unreserved cannam@226: case ':': case '@': // pchar cannam@226: case '/': // separator cannam@226: // sub-delims cannam@226: case '!': case '$': case '&': case '\'': case '(': case ')': cannam@226: case '*': case '+': case ',': case ';': case '=': cannam@226: return true; cannam@226: default: cannam@226: return false; cannam@226: } cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_file_uri(const uint8_t* path, cannam@226: const uint8_t* hostname, cannam@226: SerdURI* out, cannam@226: bool escape) cannam@226: { cannam@226: const size_t path_len = strlen((const char*)path); cannam@226: const size_t hostname_len = hostname ? strlen((const char*)hostname) : 0; cannam@226: const bool evil = is_windows_path(path); cannam@226: size_t uri_len = 0; cannam@226: uint8_t* uri = NULL; cannam@226: cannam@226: if (path[0] == '/' || is_windows_path(path)) { cannam@226: uri_len = strlen("file://") + hostname_len + evil; cannam@226: uri = (uint8_t*)malloc(uri_len + 1); cannam@226: snprintf((char*)uri, uri_len + 1, "file://%s%s", cannam@226: hostname ? (const char*)hostname : "", cannam@226: evil ? "/" : ""); cannam@226: } cannam@226: cannam@226: SerdChunk chunk = { uri, uri_len }; cannam@226: for (size_t i = 0; i < path_len; ++i) { cannam@226: if (evil && path[i] == '\\') { cannam@226: serd_chunk_sink("/", 1, &chunk); cannam@226: } else if (path[i] == '%') { cannam@226: serd_chunk_sink("%%", 2, &chunk); cannam@226: } else if (!escape || is_uri_path_char(path[i])) { cannam@226: serd_chunk_sink(path + i, 1, &chunk); cannam@226: } else { cannam@226: char escape_str[4] = { '%', 0, 0, 0 }; cannam@226: snprintf(escape_str + 1, sizeof(escape_str) - 1, "%X", path[i]); cannam@226: serd_chunk_sink(escape_str, 3, &chunk); cannam@226: } cannam@226: } cannam@226: serd_chunk_sink_finish(&chunk); cannam@226: cannam@226: if (out) { cannam@226: serd_uri_parse(chunk.buf, out); cannam@226: } cannam@226: cannam@226: return serd_node_from_string(SERD_URI, chunk.buf); cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_uri(const SerdURI* uri, const SerdURI* base, SerdURI* out) cannam@226: { cannam@226: SerdURI abs_uri = *uri; cannam@226: if (base) { cannam@226: serd_uri_resolve(uri, base, &abs_uri); cannam@226: } cannam@226: cannam@226: const size_t len = serd_uri_string_length(&abs_uri); cannam@226: uint8_t* buf = (uint8_t*)malloc(len + 1); cannam@226: SerdNode node = { buf, 0, 0, 0, SERD_URI }; cannam@226: uint8_t* ptr = buf; cannam@226: const size_t actual_len = serd_uri_serialise(&abs_uri, string_sink, &ptr); cannam@226: cannam@226: buf[actual_len] = '\0'; cannam@226: node.n_bytes = actual_len; cannam@226: node.n_chars = serd_strlen(buf, NULL, NULL); cannam@226: cannam@226: if (out) { cannam@226: serd_uri_parse(buf, out); // TODO: cleverly avoid double parse cannam@226: } cannam@226: cannam@226: return node; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_relative_uri(const SerdURI* uri, cannam@226: const SerdURI* base, cannam@226: const SerdURI* root, cannam@226: SerdURI* out) cannam@226: { cannam@226: const size_t uri_len = serd_uri_string_length(uri); cannam@226: const size_t base_len = serd_uri_string_length(base); cannam@226: uint8_t* buf = (uint8_t*)malloc(uri_len + base_len + 1); cannam@226: SerdNode node = { buf, 0, 0, 0, SERD_URI }; cannam@226: uint8_t* ptr = buf; cannam@226: const size_t actual_len = serd_uri_serialise_relative( cannam@226: uri, base, root, string_sink, &ptr); cannam@226: cannam@226: buf[actual_len] = '\0'; cannam@226: node.n_bytes = actual_len; cannam@226: node.n_chars = serd_strlen(buf, NULL, NULL); cannam@226: cannam@226: if (out) { cannam@226: serd_uri_parse(buf, out); // TODO: cleverly avoid double parse cannam@226: } cannam@226: cannam@226: return node; cannam@226: } cannam@226: cannam@226: static inline unsigned cannam@226: serd_digits(double abs) cannam@226: { cannam@226: const double lg = ceil(log10(floor(abs) + 1.0)); cannam@226: return lg < 1.0 ? 1U : (unsigned)lg; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_decimal(double d, unsigned frac_digits) cannam@226: { cannam@226: if (isnan(d) || isinf(d)) { cannam@226: return SERD_NODE_NULL; cannam@226: } cannam@226: cannam@226: const double abs_d = fabs(d); cannam@226: const unsigned int_digits = serd_digits(abs_d); cannam@226: char* buf = (char*)calloc(int_digits + frac_digits + 3, 1); cannam@226: SerdNode node = { (const uint8_t*)buf, 0, 0, 0, SERD_LITERAL }; cannam@226: const double int_part = floor(abs_d); cannam@226: cannam@226: // Point s to decimal point location cannam@226: char* s = buf + int_digits; cannam@226: if (d < 0.0) { cannam@226: *buf = '-'; cannam@226: ++s; cannam@226: } cannam@226: cannam@226: // Write integer part (right to left) cannam@226: char* t = s - 1; cannam@226: uint64_t dec = (uint64_t)int_part; cannam@226: do { cannam@226: *t-- = '0' + (dec % 10); cannam@226: } while ((dec /= 10) > 0); cannam@226: cannam@226: *s++ = '.'; cannam@226: cannam@226: // Write fractional part (right to left) cannam@226: double frac_part = fabs(d - int_part); cannam@226: if (frac_part < DBL_EPSILON) { cannam@226: *s++ = '0'; cannam@226: node.n_bytes = node.n_chars = (s - buf); cannam@226: } else { cannam@226: uint64_t frac = frac_part * pow(10.0, (int)frac_digits) + 0.5; cannam@226: s += frac_digits - 1; cannam@226: unsigned i = 0; cannam@226: cannam@226: // Skip trailing zeros cannam@226: for (; i < frac_digits - 1 && !(frac % 10); ++i, --s, frac /= 10) {} cannam@226: cannam@226: node.n_bytes = node.n_chars = (s - buf) + 1; cannam@226: cannam@226: // Write digits from last trailing zero to decimal point cannam@226: for (; i < frac_digits; ++i) { cannam@226: *s-- = '0' + (frac % 10); cannam@226: frac /= 10; cannam@226: } cannam@226: } cannam@226: cannam@226: return node; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_integer(int64_t i) cannam@226: { cannam@226: int64_t abs_i = (i < 0) ? -i : i; cannam@226: const unsigned digits = serd_digits(abs_i); cannam@226: char* buf = (char*)calloc(digits + 2, 1); cannam@226: SerdNode node = { (const uint8_t*)buf, 0, 0, 0, SERD_LITERAL }; cannam@226: cannam@226: // Point s to the end cannam@226: char* s = buf + digits - 1; cannam@226: if (i < 0) { cannam@226: *buf = '-'; cannam@226: ++s; cannam@226: } cannam@226: cannam@226: node.n_bytes = node.n_chars = (s - buf) + 1; cannam@226: cannam@226: // Write integer part (right to left) cannam@226: do { cannam@226: *s-- = '0' + (abs_i % 10); cannam@226: } while ((abs_i /= 10) > 0); cannam@226: cannam@226: return node; cannam@226: } cannam@226: cannam@226: /** cannam@226: Base64 encoding table. cannam@226: @see RFC3986 S3. cannam@226: */ cannam@226: static const uint8_t b64_map[] = cannam@226: "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"; cannam@226: cannam@226: /** cannam@226: Encode 3 raw bytes to 4 base64 characters. cannam@226: */ cannam@226: static inline void cannam@226: encode_chunk(uint8_t out[4], const uint8_t in[3], size_t n_in) cannam@226: { cannam@226: out[0] = b64_map[in[0] >> 2]; cannam@226: out[1] = b64_map[((in[0] & 0x03) << 4) | ((in[1] & 0xF0) >> 4)]; cannam@226: out[2] = ((n_in > 1) cannam@226: ? (b64_map[((in[1] & 0x0F) << 2) | ((in[2] & 0xC0) >> 6)]) cannam@226: : (uint8_t)'='); cannam@226: out[3] = ((n_in > 2) ? b64_map[in[2] & 0x3F] : (uint8_t)'='); cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: SerdNode cannam@226: serd_node_new_blob(const void* buf, size_t size, bool wrap_lines) cannam@226: { cannam@226: const size_t len = ((size + 2) / 3) * 4 + (wrap_lines ? (size / 57) : 0); cannam@226: uint8_t* str = (uint8_t*)calloc(1, len + 2); cannam@226: SerdNode node = { str, len, len, 0, SERD_LITERAL }; cannam@226: for (size_t i = 0, j = 0; i < size; i += 3, j += 4) { cannam@226: uint8_t in[4] = { 0, 0, 0, 0 }; cannam@226: size_t n_in = MIN(3, size - i); cannam@226: memcpy(in, (const uint8_t*)buf + i, n_in); cannam@226: cannam@226: if (wrap_lines && i > 0 && (i % 57) == 0) { cannam@226: str[j++] = '\n'; cannam@226: node.flags |= SERD_HAS_NEWLINE; cannam@226: } cannam@226: cannam@226: encode_chunk(str + j, in, n_in); cannam@226: } cannam@226: return node; cannam@226: } cannam@226: cannam@226: SERD_API cannam@226: void cannam@226: serd_node_free(SerdNode* node) cannam@226: { cannam@226: if (node && node->buf) { cannam@226: free((uint8_t*)node->buf); cannam@226: node->buf = NULL; cannam@226: } cannam@226: }