annotate win32-mingw/include/capnp/serialize.h @ 159:f4b37539fcc7

Rebuild win32 Opus using mingw 5 rather than 7 to avoid runtime incompatibility
author Chris Cannam <cannam@all-day-breakfast.com>
date Wed, 30 Jan 2019 10:30:56 +0000
parents 279b18cc7785
children
rev   line source
cannam@149 1 // Copyright (c) 2013-2014 Sandstorm Development Group, Inc. and contributors
cannam@149 2 // Licensed under the MIT License:
cannam@149 3 //
cannam@149 4 // Permission is hereby granted, free of charge, to any person obtaining a copy
cannam@149 5 // of this software and associated documentation files (the "Software"), to deal
cannam@149 6 // in the Software without restriction, including without limitation the rights
cannam@149 7 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
cannam@149 8 // copies of the Software, and to permit persons to whom the Software is
cannam@149 9 // furnished to do so, subject to the following conditions:
cannam@149 10 //
cannam@149 11 // The above copyright notice and this permission notice shall be included in
cannam@149 12 // all copies or substantial portions of the Software.
cannam@149 13 //
cannam@149 14 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
cannam@149 15 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
cannam@149 16 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
cannam@149 17 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
cannam@149 18 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
cannam@149 19 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
cannam@149 20 // THE SOFTWARE.
cannam@149 21
cannam@149 22 // This file implements a simple serialization format for Cap'n Proto messages. The format
cannam@149 23 // is as follows:
cannam@149 24 //
cannam@149 25 // * 32-bit little-endian segment count (4 bytes).
cannam@149 26 // * 32-bit little-endian size of each segment (4*(segment count) bytes).
cannam@149 27 // * Padding so that subsequent data is 64-bit-aligned (0 or 4 bytes). (I.e., if there are an even
cannam@149 28 // number of segments, there are 4 bytes of zeros here, otherwise there is no padding.)
cannam@149 29 // * Data from each segment, in order (8*sum(segment sizes) bytes)
cannam@149 30 //
cannam@149 31 // This format has some important properties:
cannam@149 32 // - It is self-delimiting, so multiple messages may be written to a stream without any external
cannam@149 33 // delimiter.
cannam@149 34 // - The total size and position of each segment can be determined by reading only the first part
cannam@149 35 // of the message, allowing lazy and random-access reading of the segment data.
cannam@149 36 // - A message is always at least 8 bytes.
cannam@149 37 // - A single-segment message can be read entirely in two system calls with no buffering.
cannam@149 38 // - A multi-segment message can be read entirely in three system calls with no buffering.
cannam@149 39 // - The format is appropriate for mmap()ing since all data is aligned.
cannam@149 40
cannam@149 41 #ifndef CAPNP_SERIALIZE_H_
cannam@149 42 #define CAPNP_SERIALIZE_H_
cannam@149 43
cannam@149 44 #if defined(__GNUC__) && !defined(CAPNP_HEADER_WARNINGS)
cannam@149 45 #pragma GCC system_header
cannam@149 46 #endif
cannam@149 47
cannam@149 48 #include "message.h"
cannam@149 49 #include <kj/io.h>
cannam@149 50
cannam@149 51 namespace capnp {
cannam@149 52
cannam@149 53 class FlatArrayMessageReader: public MessageReader {
cannam@149 54 // Parses a message from a flat array. Note that it makes sense to use this together with mmap()
cannam@149 55 // for extremely fast parsing.
cannam@149 56
cannam@149 57 public:
cannam@149 58 FlatArrayMessageReader(kj::ArrayPtr<const word> array, ReaderOptions options = ReaderOptions());
cannam@149 59 // The array must remain valid until the MessageReader is destroyed.
cannam@149 60
cannam@149 61 kj::ArrayPtr<const word> getSegment(uint id) override;
cannam@149 62
cannam@149 63 const word* getEnd() const { return end; }
cannam@149 64 // Get a pointer just past the end of the message as determined by reading the message header.
cannam@149 65 // This could actually be before the end of the input array. This pointer is useful e.g. if
cannam@149 66 // you know that the input array has extra stuff appended after the message and you want to
cannam@149 67 // get at it.
cannam@149 68
cannam@149 69 private:
cannam@149 70 // Optimize for single-segment case.
cannam@149 71 kj::ArrayPtr<const word> segment0;
cannam@149 72 kj::Array<kj::ArrayPtr<const word>> moreSegments;
cannam@149 73 const word* end;
cannam@149 74 };
cannam@149 75
cannam@149 76 kj::ArrayPtr<const word> initMessageBuilderFromFlatArrayCopy(
cannam@149 77 kj::ArrayPtr<const word> array, MessageBuilder& target,
cannam@149 78 ReaderOptions options = ReaderOptions());
cannam@149 79 // Convenience function which reads a message using `FlatArrayMessageReader` then copies the
cannam@149 80 // content into the target `MessageBuilder`, verifying that the message structure is valid
cannam@149 81 // (although not necessarily that it matches the desired schema).
cannam@149 82 //
cannam@149 83 // Returns an ArrayPtr containing any words left over in the array after consuming the whole
cannam@149 84 // message. This is useful when reading multiple messages that have been concatenated. See also
cannam@149 85 // FlatArrayMessageReader::getEnd().
cannam@149 86 //
cannam@149 87 // (Note that it's also possible to initialize a `MessageBuilder` directly without a copy using one
cannam@149 88 // of `MessageBuilder`'s constructors. However, this approach skips the validation step and is not
cannam@149 89 // safe to use on untrusted input. Therefore, we do not provide a convenience method for it.)
cannam@149 90
cannam@149 91 kj::Array<word> messageToFlatArray(MessageBuilder& builder);
cannam@149 92 // Constructs a flat array containing the entire content of the given message.
cannam@149 93 //
cannam@149 94 // To output the message as bytes, use `.asBytes()` on the returned word array. Keep in mind that
cannam@149 95 // `asBytes()` returns an ArrayPtr, so you have to save the Array as well to prevent it from being
cannam@149 96 // deleted. For example:
cannam@149 97 //
cannam@149 98 // kj::Array<capnp::word> words = messageToFlatArray(myMessage);
cannam@149 99 // kj::ArrayPtr<kj::byte> bytes = words.asBytes();
cannam@149 100 // write(fd, bytes.begin(), bytes.size());
cannam@149 101
cannam@149 102 kj::Array<word> messageToFlatArray(kj::ArrayPtr<const kj::ArrayPtr<const word>> segments);
cannam@149 103 // Version of messageToFlatArray that takes a raw segment array.
cannam@149 104
cannam@149 105 size_t computeSerializedSizeInWords(MessageBuilder& builder);
cannam@149 106 // Returns the size, in words, that will be needed to serialize the message, including the header.
cannam@149 107
cannam@149 108 size_t computeSerializedSizeInWords(kj::ArrayPtr<const kj::ArrayPtr<const word>> segments);
cannam@149 109 // Version of computeSerializedSizeInWords that takes a raw segment array.
cannam@149 110
cannam@149 111 size_t expectedSizeInWordsFromPrefix(kj::ArrayPtr<const word> messagePrefix);
cannam@149 112 // Given a prefix of a serialized message, try to determine the expected total size of the message,
cannam@149 113 // in words. The returned size is based on the information known so far; it may be an underestimate
cannam@149 114 // if the prefix doesn't contain the full segment table.
cannam@149 115 //
cannam@149 116 // If the returned value is greater than `messagePrefix.size()`, then the message is not yet
cannam@149 117 // complete and the app cannot parse it yet. If the returned value is less than or equal to
cannam@149 118 // `messagePrefix.size()`, then the returned value is the exact total size of the message; any
cannam@149 119 // remaining bytes are part of the next message.
cannam@149 120 //
cannam@149 121 // This function is useful when reading messages from a stream in an asynchronous way, but when
cannam@149 122 // using the full KJ async infrastructure would be too difficult. Each time bytes are received,
cannam@149 123 // use this function to determine if an entire message is ready to be parsed.
cannam@149 124
cannam@149 125 // =======================================================================================
cannam@149 126
cannam@149 127 class InputStreamMessageReader: public MessageReader {
cannam@149 128 // A MessageReader that reads from an abstract kj::InputStream. See also StreamFdMessageReader
cannam@149 129 // for a subclass specific to file descriptors.
cannam@149 130
cannam@149 131 public:
cannam@149 132 InputStreamMessageReader(kj::InputStream& inputStream,
cannam@149 133 ReaderOptions options = ReaderOptions(),
cannam@149 134 kj::ArrayPtr<word> scratchSpace = nullptr);
cannam@149 135 ~InputStreamMessageReader() noexcept(false);
cannam@149 136
cannam@149 137 // implements MessageReader ----------------------------------------
cannam@149 138 kj::ArrayPtr<const word> getSegment(uint id) override;
cannam@149 139
cannam@149 140 private:
cannam@149 141 kj::InputStream& inputStream;
cannam@149 142 byte* readPos;
cannam@149 143
cannam@149 144 // Optimize for single-segment case.
cannam@149 145 kj::ArrayPtr<const word> segment0;
cannam@149 146 kj::Array<kj::ArrayPtr<const word>> moreSegments;
cannam@149 147
cannam@149 148 kj::Array<word> ownedSpace;
cannam@149 149 // Only if scratchSpace wasn't big enough.
cannam@149 150
cannam@149 151 kj::UnwindDetector unwindDetector;
cannam@149 152 };
cannam@149 153
cannam@149 154 void readMessageCopy(kj::InputStream& input, MessageBuilder& target,
cannam@149 155 ReaderOptions options = ReaderOptions(),
cannam@149 156 kj::ArrayPtr<word> scratchSpace = nullptr);
cannam@149 157 // Convenience function which reads a message using `InputStreamMessageReader` then copies the
cannam@149 158 // content into the target `MessageBuilder`, verifying that the message structure is valid
cannam@149 159 // (although not necessarily that it matches the desired schema).
cannam@149 160 //
cannam@149 161 // (Note that it's also possible to initialize a `MessageBuilder` directly without a copy using one
cannam@149 162 // of `MessageBuilder`'s constructors. However, this approach skips the validation step and is not
cannam@149 163 // safe to use on untrusted input. Therefore, we do not provide a convenience method for it.)
cannam@149 164
cannam@149 165 void writeMessage(kj::OutputStream& output, MessageBuilder& builder);
cannam@149 166 // Write the message to the given output stream.
cannam@149 167
cannam@149 168 void writeMessage(kj::OutputStream& output, kj::ArrayPtr<const kj::ArrayPtr<const word>> segments);
cannam@149 169 // Write the segment array to the given output stream.
cannam@149 170
cannam@149 171 // =======================================================================================
cannam@149 172 // Specializations for reading from / writing to file descriptors.
cannam@149 173
cannam@149 174 class StreamFdMessageReader: private kj::FdInputStream, public InputStreamMessageReader {
cannam@149 175 // A MessageReader that reads from a steam-based file descriptor.
cannam@149 176
cannam@149 177 public:
cannam@149 178 StreamFdMessageReader(int fd, ReaderOptions options = ReaderOptions(),
cannam@149 179 kj::ArrayPtr<word> scratchSpace = nullptr)
cannam@149 180 : FdInputStream(fd), InputStreamMessageReader(*this, options, scratchSpace) {}
cannam@149 181 // Read message from a file descriptor, without taking ownership of the descriptor.
cannam@149 182
cannam@149 183 StreamFdMessageReader(kj::AutoCloseFd fd, ReaderOptions options = ReaderOptions(),
cannam@149 184 kj::ArrayPtr<word> scratchSpace = nullptr)
cannam@149 185 : FdInputStream(kj::mv(fd)), InputStreamMessageReader(*this, options, scratchSpace) {}
cannam@149 186 // Read a message from a file descriptor, taking ownership of the descriptor.
cannam@149 187
cannam@149 188 ~StreamFdMessageReader() noexcept(false);
cannam@149 189 };
cannam@149 190
cannam@149 191 void readMessageCopyFromFd(int fd, MessageBuilder& target,
cannam@149 192 ReaderOptions options = ReaderOptions(),
cannam@149 193 kj::ArrayPtr<word> scratchSpace = nullptr);
cannam@149 194 // Convenience function which reads a message using `StreamFdMessageReader` then copies the
cannam@149 195 // content into the target `MessageBuilder`, verifying that the message structure is valid
cannam@149 196 // (although not necessarily that it matches the desired schema).
cannam@149 197 //
cannam@149 198 // (Note that it's also possible to initialize a `MessageBuilder` directly without a copy using one
cannam@149 199 // of `MessageBuilder`'s constructors. However, this approach skips the validation step and is not
cannam@149 200 // safe to use on untrusted input. Therefore, we do not provide a convenience method for it.)
cannam@149 201
cannam@149 202 void writeMessageToFd(int fd, MessageBuilder& builder);
cannam@149 203 // Write the message to the given file descriptor.
cannam@149 204 //
cannam@149 205 // This function throws an exception on any I/O error. If your code is not exception-safe, be sure
cannam@149 206 // you catch this exception at the call site. If throwing an exception is not acceptable, you
cannam@149 207 // can implement your own OutputStream with arbitrary error handling and then use writeMessage().
cannam@149 208
cannam@149 209 void writeMessageToFd(int fd, kj::ArrayPtr<const kj::ArrayPtr<const word>> segments);
cannam@149 210 // Write the segment array to the given file descriptor.
cannam@149 211 //
cannam@149 212 // This function throws an exception on any I/O error. If your code is not exception-safe, be sure
cannam@149 213 // you catch this exception at the call site. If throwing an exception is not acceptable, you
cannam@149 214 // can implement your own OutputStream with arbitrary error handling and then use writeMessage().
cannam@149 215
cannam@149 216 // =======================================================================================
cannam@149 217 // inline stuff
cannam@149 218
cannam@149 219 inline kj::Array<word> messageToFlatArray(MessageBuilder& builder) {
cannam@149 220 return messageToFlatArray(builder.getSegmentsForOutput());
cannam@149 221 }
cannam@149 222
cannam@149 223 inline size_t computeSerializedSizeInWords(MessageBuilder& builder) {
cannam@149 224 return computeSerializedSizeInWords(builder.getSegmentsForOutput());
cannam@149 225 }
cannam@149 226
cannam@149 227 inline void writeMessage(kj::OutputStream& output, MessageBuilder& builder) {
cannam@149 228 writeMessage(output, builder.getSegmentsForOutput());
cannam@149 229 }
cannam@149 230
cannam@149 231 inline void writeMessageToFd(int fd, MessageBuilder& builder) {
cannam@149 232 writeMessageToFd(fd, builder.getSegmentsForOutput());
cannam@149 233 }
cannam@149 234
cannam@149 235 } // namespace capnp
cannam@149 236
cannam@149 237 #endif // SERIALIZE_H_