cannam@134: // Copyright (c) 2013-2014 Sandstorm Development Group, Inc. and contributors cannam@134: // Licensed under the MIT License: cannam@134: // cannam@134: // Permission is hereby granted, free of charge, to any person obtaining a copy cannam@134: // of this software and associated documentation files (the "Software"), to deal cannam@134: // in the Software without restriction, including without limitation the rights cannam@134: // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell cannam@134: // copies of the Software, and to permit persons to whom the Software is cannam@134: // furnished to do so, subject to the following conditions: cannam@134: // cannam@134: // The above copyright notice and this permission notice shall be included in cannam@134: // all copies or substantial portions of the Software. cannam@134: // cannam@134: // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR cannam@134: // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, cannam@134: // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE cannam@134: // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER cannam@134: // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, cannam@134: // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN cannam@134: // THE SOFTWARE. cannam@134: cannam@134: #ifndef KJ_STRING_TREE_H_ cannam@134: #define KJ_STRING_TREE_H_ cannam@134: cannam@134: #if defined(__GNUC__) && !KJ_HEADER_WARNINGS cannam@134: #pragma GCC system_header cannam@134: #endif cannam@134: cannam@134: #include "string.h" cannam@134: cannam@134: namespace kj { cannam@134: cannam@134: class StringTree { cannam@134: // A long string, represented internally as a tree of strings. This data structure is like a cannam@134: // String, but optimized for concatenation and iteration at the expense of seek time. The cannam@134: // structure is intended to be used for building large text blobs from many small pieces, where cannam@134: // repeatedly concatenating smaller strings into larger ones would waste copies. This structure cannam@134: // is NOT intended for use cases requiring random access or computing substrings. For those, cannam@134: // you should use a Rope, which is a much more complicated data structure. cannam@134: // cannam@134: // The proper way to construct a StringTree is via kj::strTree(...), which works just like cannam@134: // kj::str(...) but returns a StringTree rather than a String. cannam@134: // cannam@134: // KJ_STRINGIFY() functions that construct large strings from many smaller strings are encouraged cannam@134: // to return StringTree rather than a flat char container. cannam@134: cannam@134: public: cannam@134: inline StringTree(): size_(0) {} cannam@134: inline StringTree(String&& text): size_(text.size()), text(kj::mv(text)) {} cannam@134: cannam@134: StringTree(Array&& pieces, StringPtr delim); cannam@134: // Build a StringTree by concatenating the given pieces, delimited by the given delimiter cannam@134: // (e.g. ", "). cannam@134: cannam@134: inline size_t size() const { return size_; } cannam@134: cannam@134: template cannam@134: void visit(Func&& func) const; cannam@134: cannam@134: String flatten() const; cannam@134: // Return the contents as a string. cannam@134: cannam@134: // TODO(someday): flatten() when *this is an rvalue and when branches.size() == 0 could simply cannam@134: // return `kj::mv(text)`. Requires reference qualifiers (Clang 3.3 / GCC 4.8). cannam@134: cannam@134: void flattenTo(char* __restrict__ target) const; cannam@134: // Copy the contents to the given character array. Does not add a NUL terminator. cannam@134: cannam@134: private: cannam@134: size_t size_; cannam@134: String text; cannam@134: cannam@134: struct Branch; cannam@134: Array branches; // In order. cannam@134: cannam@134: inline void fill(char* pos, size_t branchIndex); cannam@134: template cannam@134: void fill(char* pos, size_t branchIndex, First&& first, Rest&&... rest); cannam@134: template cannam@134: void fill(char* pos, size_t branchIndex, StringTree&& first, Rest&&... rest); cannam@134: template cannam@134: void fill(char* pos, size_t branchIndex, Array&& first, Rest&&... rest); cannam@134: template cannam@134: void fill(char* pos, size_t branchIndex, String&& first, Rest&&... rest); cannam@134: cannam@134: template cannam@134: static StringTree concat(Params&&... params); cannam@134: static StringTree&& concat(StringTree&& param) { return kj::mv(param); } cannam@134: cannam@134: template cannam@134: static inline size_t flatSize(const T& t) { return t.size(); } cannam@134: static inline size_t flatSize(String&& s) { return 0; } cannam@134: static inline size_t flatSize(StringTree&& s) { return 0; } cannam@134: cannam@134: template cannam@134: static inline size_t branchCount(const T& t) { return 0; } cannam@134: static inline size_t branchCount(String&& s) { return 1; } cannam@134: static inline size_t branchCount(StringTree&& s) { return 1; } cannam@134: cannam@134: template cannam@134: friend StringTree strTree(Params&&... params); cannam@134: }; cannam@134: cannam@134: inline StringTree&& KJ_STRINGIFY(StringTree&& tree) { return kj::mv(tree); } cannam@134: inline const StringTree& KJ_STRINGIFY(const StringTree& tree) { return tree; } cannam@134: cannam@134: inline StringTree KJ_STRINGIFY(Array&& trees) { return StringTree(kj::mv(trees), ""); } cannam@134: cannam@134: template cannam@134: StringTree strTree(Params&&... params); cannam@134: // Build a StringTree by stringifying the given parameters and concatenating the results. cannam@134: // If any of the parameters stringify to StringTree rvalues, they will be incorporated as cannam@134: // branches to avoid a copy. cannam@134: cannam@134: // ======================================================================================= cannam@134: // Inline implementation details cannam@134: cannam@134: namespace _ { // private cannam@134: cannam@134: template cannam@134: char* fill(char* __restrict__ target, const StringTree& first, Rest&&... rest) { cannam@134: // Make str() work with stringifiers that return StringTree by patching fill(). cannam@134: cannam@134: first.flattenTo(target); cannam@134: return fill(target + first.size(), kj::fwd(rest)...); cannam@134: } cannam@134: cannam@134: template constexpr bool isStringTree() { return false; } cannam@134: template <> constexpr bool isStringTree() { return true; } cannam@134: cannam@134: inline StringTree&& toStringTreeOrCharSequence(StringTree&& tree) { return kj::mv(tree); } cannam@134: inline StringTree toStringTreeOrCharSequence(String&& str) { return StringTree(kj::mv(str)); } cannam@134: cannam@134: template cannam@134: inline auto toStringTreeOrCharSequence(T&& value) cannam@134: -> decltype(toCharSequence(kj::fwd(value))) { cannam@134: static_assert(!isStringTree>(), cannam@134: "When passing a StringTree into kj::strTree(), either pass it by rvalue " cannam@134: "(use kj::mv(value)) or explicitly call value.flatten() to make a copy."); cannam@134: cannam@134: return toCharSequence(kj::fwd(value)); cannam@134: } cannam@134: cannam@134: } // namespace _ (private) cannam@134: cannam@134: struct StringTree::Branch { cannam@134: size_t index; cannam@134: // Index in `text` where this branch should be inserted. cannam@134: cannam@134: StringTree content; cannam@134: }; cannam@134: cannam@134: template cannam@134: void StringTree::visit(Func&& func) const { cannam@134: size_t pos = 0; cannam@134: for (auto& branch: branches) { cannam@134: if (branch.index > pos) { cannam@134: func(text.slice(pos, branch.index)); cannam@134: pos = branch.index; cannam@134: } cannam@134: branch.content.visit(func); cannam@134: } cannam@134: if (text.size() > pos) { cannam@134: func(text.slice(pos, text.size())); cannam@134: } cannam@134: } cannam@134: cannam@134: inline void StringTree::fill(char* pos, size_t branchIndex) { cannam@134: KJ_IREQUIRE(pos == text.end() && branchIndex == branches.size(), cannam@134: kj::str(text.end() - pos, ' ', branches.size() - branchIndex).cStr()); cannam@134: } cannam@134: cannam@134: template cannam@134: void StringTree::fill(char* pos, size_t branchIndex, First&& first, Rest&&... rest) { cannam@134: pos = _::fill(pos, kj::fwd(first)); cannam@134: fill(pos, branchIndex, kj::fwd(rest)...); cannam@134: } cannam@134: cannam@134: template cannam@134: void StringTree::fill(char* pos, size_t branchIndex, StringTree&& first, Rest&&... rest) { cannam@134: branches[branchIndex].index = pos - text.begin(); cannam@134: branches[branchIndex].content = kj::mv(first); cannam@134: fill(pos, branchIndex + 1, kj::fwd(rest)...); cannam@134: } cannam@134: cannam@134: template cannam@134: void StringTree::fill(char* pos, size_t branchIndex, String&& first, Rest&&... rest) { cannam@134: branches[branchIndex].index = pos - text.begin(); cannam@134: branches[branchIndex].content = StringTree(kj::mv(first)); cannam@134: fill(pos, branchIndex + 1, kj::fwd(rest)...); cannam@134: } cannam@134: cannam@134: template cannam@134: StringTree StringTree::concat(Params&&... params) { cannam@134: StringTree result; cannam@134: result.size_ = _::sum({params.size()...}); cannam@134: result.text = heapString( cannam@134: _::sum({StringTree::flatSize(kj::fwd(params))...})); cannam@134: result.branches = heapArray( cannam@134: _::sum({StringTree::branchCount(kj::fwd(params))...})); cannam@134: result.fill(result.text.begin(), 0, kj::fwd(params)...); cannam@134: return result; cannam@134: } cannam@134: cannam@134: template cannam@134: StringTree strTree(Params&&... params) { cannam@134: return StringTree::concat(_::toStringTreeOrCharSequence(kj::fwd(params))...); cannam@134: } cannam@134: cannam@134: } // namespace kj cannam@134: cannam@134: #endif // KJ_STRING_TREE_H_