// Copyright (c) 2013-2014 Sandstorm Development Group, Inc. and contributors
// Licensed under the MIT License:
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.
cannam@132: cannam@132: #ifndef KJ_ASYNC_IO_H_ cannam@132: #define KJ_ASYNC_IO_H_ cannam@132: cannam@132: #if defined(__GNUC__) && !KJ_HEADER_WARNINGS cannam@132: #pragma GCC system_header cannam@132: #endif cannam@132: cannam@132: #include "async.h" cannam@132: #include "function.h" cannam@132: #include "thread.h" cannam@132: #include "time.h" cannam@132: cannam@132: struct sockaddr; cannam@132: cannam@132: namespace kj { cannam@132: cannam@132: class UnixEventPort; cannam@132: class NetworkAddress; cannam@132: cannam@132: // ======================================================================================= cannam@132: // Streaming I/O cannam@132: cannam@132: class AsyncInputStream { cannam@132: // Asynchronous equivalent of InputStream (from io.h). cannam@132: cannam@132: public: cannam@132: virtual Promise read(void* buffer, size_t minBytes, size_t maxBytes) = 0; cannam@132: virtual Promise tryRead(void* buffer, size_t minBytes, size_t maxBytes) = 0; cannam@132: cannam@132: Promise read(void* buffer, size_t bytes); cannam@132: }; cannam@132: cannam@132: class AsyncOutputStream { cannam@132: // Asynchronous equivalent of OutputStream (from io.h). cannam@132: cannam@132: public: cannam@132: virtual Promise write(const void* buffer, size_t size) = 0; cannam@132: virtual Promise write(ArrayPtr> pieces) = 0; cannam@132: }; cannam@132: cannam@132: class AsyncIoStream: public AsyncInputStream, public AsyncOutputStream { cannam@132: // A combination input and output stream. cannam@132: cannam@132: public: cannam@132: virtual void shutdownWrite() = 0; cannam@132: // Cleanly shut down just the write end of the stream, while keeping the read end open. cannam@132: cannam@132: virtual void abortRead() {} cannam@132: // Similar to shutdownWrite, but this will shut down the read end of the stream, and should only cannam@132: // be called when an error has occurred. 
cannam@132: cannam@132: virtual void getsockopt(int level, int option, void* value, uint* length); cannam@132: virtual void setsockopt(int level, int option, const void* value, uint length); cannam@132: // Corresponds to getsockopt() and setsockopt() syscalls. Will throw an "unimplemented" exception cannam@132: // if the stream is not a socket or the option is not appropriate for the socket type. The cannam@132: // default implementations always throw "unimplemented". cannam@132: cannam@132: virtual void getsockname(struct sockaddr* addr, uint* length); cannam@132: virtual void getpeername(struct sockaddr* addr, uint* length); cannam@132: // Corresponds to getsockname() and getpeername() syscalls. Will throw an "unimplemented" cannam@132: // exception if the stream is not a socket. The default implementations always throw cannam@132: // "unimplemented". cannam@132: // cannam@132: // Note that we don't provide methods that return NetworkAddress because it usually wouldn't cannam@132: // be useful. You can't connect() to or listen() on these addresses, obviously, because they are cannam@132: // ephemeral addresses for a single connection. cannam@132: }; cannam@132: cannam@132: struct OneWayPipe { cannam@132: // A data pipe with an input end and an output end. (Typically backed by pipe() system call.) cannam@132: cannam@132: Own in; cannam@132: Own out; cannam@132: }; cannam@132: cannam@132: struct TwoWayPipe { cannam@132: // A data pipe that supports sending in both directions. Each end's output sends data to the cannam@132: // other end's input. (Typically backed by socketpair() system call.) cannam@132: cannam@132: Own ends[2]; cannam@132: }; cannam@132: cannam@132: class ConnectionReceiver { cannam@132: // Represents a server socket listening on a port. cannam@132: cannam@132: public: cannam@132: virtual Promise> accept() = 0; cannam@132: // Accept the next incoming connection. 
cannam@132: cannam@132: virtual uint getPort() = 0; cannam@132: // Gets the port number, if applicable (i.e. if listening on IP). This is useful if you didn't cannam@132: // specify a port when constructing the NetworkAddress -- one will have been assigned cannam@132: // automatically. cannam@132: cannam@132: virtual void getsockopt(int level, int option, void* value, uint* length); cannam@132: virtual void setsockopt(int level, int option, const void* value, uint length); cannam@132: // Same as the methods of AsyncIoStream. cannam@132: }; cannam@132: cannam@132: // ======================================================================================= cannam@132: // Datagram I/O cannam@132: cannam@132: class AncillaryMessage { cannam@132: // Represents an ancillary message (aka control message) received using the recvmsg() system cannam@132: // call (or equivalent). Most apps will not use this. cannam@132: cannam@132: public: cannam@132: inline AncillaryMessage(int level, int type, ArrayPtr data); cannam@132: AncillaryMessage() = default; cannam@132: cannam@132: inline int getLevel() const; cannam@132: // Originating protocol / socket level. cannam@132: cannam@132: inline int getType() const; cannam@132: // Protocol-specific message type. cannam@132: cannam@132: template cannam@132: inline Maybe as(); cannam@132: // Interpret the ancillary message as the given struct type. Most ancillary messages are some cannam@132: // sort of struct, so this is a convenient way to access it. Returns nullptr if the message cannam@132: // is smaller than the struct -- this can happen if the message was truncated due to cannam@132: // insufficient ancillary buffer space. cannam@132: cannam@132: template cannam@132: inline ArrayPtr asArray(); cannam@132: // Interpret the ancillary message as an array of items. 
If the message size does not evenly cannam@132: // divide into elements of type T, the remainder is discarded -- this can happen if the message cannam@132: // was truncated due to insufficient ancillary buffer space. cannam@132: cannam@132: private: cannam@132: int level; cannam@132: int type; cannam@132: ArrayPtr data; cannam@132: // Message data. In most cases you should use `as()` or `asArray()`. cannam@132: }; cannam@132: cannam@132: class DatagramReceiver { cannam@132: // Class encapsulating the recvmsg() system call. You must specify the DatagramReceiver's cannam@132: // capacity in advance; if a received packet is larger than the capacity, it will be truncated. cannam@132: cannam@132: public: cannam@132: virtual Promise receive() = 0; cannam@132: // Receive a new message, overwriting this object's content. cannam@132: // cannam@132: // receive() may reuse the same buffers for content and ancillary data with each call. cannam@132: cannam@132: template cannam@132: struct MaybeTruncated { cannam@132: T value; cannam@132: cannam@132: bool isTruncated; cannam@132: // True if the Receiver's capacity was insufficient to receive the value and therefore the cannam@132: // value is truncated. cannam@132: }; cannam@132: cannam@132: virtual MaybeTruncated> getContent() = 0; cannam@132: // Get the content of the datagram. cannam@132: cannam@132: virtual MaybeTruncated> getAncillary() = 0; cannam@132: // Ancilarry messages received with the datagram. See the recvmsg() system call and the cmsghdr cannam@132: // struct. Most apps don't need this. cannam@132: // cannam@132: // If the returned value is truncated, then the last message in the array may itself be cannam@132: // truncated, meaning its as() method will return nullptr or its asArray() method will cannam@132: // return fewer elements than expected. Truncation can also mean that additional messages were cannam@132: // available but discarded. 
cannam@132: cannam@132: virtual NetworkAddress& getSource() = 0; cannam@132: // Get the datagram sender's address. cannam@132: cannam@132: struct Capacity { cannam@132: size_t content = 8192; cannam@132: // How much space to allocate for the datagram content. If a datagram is received that is cannam@132: // larger than this, it will be truncated, with no way to recover the tail. cannam@132: cannam@132: size_t ancillary = 0; cannam@132: // How much space to allocate for ancillary messages. As with content, if the ancillary data cannam@132: // is larger than this, it will be truncated. cannam@132: }; cannam@132: }; cannam@132: cannam@132: class DatagramPort { cannam@132: public: cannam@132: virtual Promise send(const void* buffer, size_t size, NetworkAddress& destination) = 0; cannam@132: virtual Promise send(ArrayPtr> pieces, cannam@132: NetworkAddress& destination) = 0; cannam@132: cannam@132: virtual Own makeReceiver( cannam@132: DatagramReceiver::Capacity capacity = DatagramReceiver::Capacity()) = 0; cannam@132: // Create a new `Receiver` that can be used to receive datagrams. `capacity` specifies how much cannam@132: // space to allocate for the received message. The `DatagramPort` must outlive the `Receiver`. cannam@132: cannam@132: virtual uint getPort() = 0; cannam@132: // Gets the port number, if applicable (i.e. if listening on IP). This is useful if you didn't cannam@132: // specify a port when constructing the NetworkAddress -- one will have been assigned cannam@132: // automatically. cannam@132: cannam@132: virtual void getsockopt(int level, int option, void* value, uint* length); cannam@132: virtual void setsockopt(int level, int option, const void* value, uint length); cannam@132: // Same as the methods of AsyncIoStream. 
cannam@132: }; cannam@132: cannam@132: // ======================================================================================= cannam@132: // Networks cannam@132: cannam@132: class NetworkAddress { cannam@132: // Represents a remote address to which the application can connect. cannam@132: cannam@132: public: cannam@132: virtual Promise> connect() = 0; cannam@132: // Make a new connection to this address. cannam@132: // cannam@132: // The address must not be a wildcard ("*"). If it is an IP address, it must have a port number. cannam@132: cannam@132: virtual Own listen() = 0; cannam@132: // Listen for incoming connections on this address. cannam@132: // cannam@132: // The address must be local. cannam@132: cannam@132: virtual Own bindDatagramPort(); cannam@132: // Open this address as a datagram (e.g. UDP) port. cannam@132: // cannam@132: // The address must be local. cannam@132: cannam@132: virtual Own clone() = 0; cannam@132: // Returns an equivalent copy of this NetworkAddress. cannam@132: cannam@132: virtual String toString() = 0; cannam@132: // Produce a human-readable string which hopefully can be passed to Network::parseAddress() cannam@132: // to reproduce this address, although whether or not that works of course depends on the Network cannam@132: // implementation. This should be called only to display the address to human users, who will cannam@132: // hopefully know what they are able to do with it. cannam@132: }; cannam@132: cannam@132: class Network { cannam@132: // Factory for NetworkAddress instances, representing the network services offered by the cannam@132: // operating system. cannam@132: // cannam@132: // This interface typically represents broad authority, and well-designed code should limit its cannam@132: // use to high-level startup code and user interaction. Low-level APIs should accept cannam@132: // NetworkAddress instances directly and work from there, if at all possible. 
cannam@132: cannam@132: public: cannam@132: virtual Promise> parseAddress(StringPtr addr, uint portHint = 0) = 0; cannam@132: // Construct a network address from a user-provided string. The format of the address cannam@132: // strings is not specified at the API level, and application code should make no assumptions cannam@132: // about them. These strings should always be provided by humans, and said humans will know cannam@132: // what format to use in their particular context. cannam@132: // cannam@132: // `portHint`, if provided, specifies the "standard" IP port number for the application-level cannam@132: // service in play. If the address turns out to be an IP address (v4 or v6), and it lacks a cannam@132: // port number, this port will be used. If `addr` lacks a port number *and* `portHint` is cannam@132: // omitted, then the returned address will only support listen() and bindDatagramPort() cannam@132: // (not connect()), and an unused port will be chosen each time one of those methods is called. cannam@132: cannam@132: virtual Own getSockaddr(const void* sockaddr, uint len) = 0; cannam@132: // Construct a network address from a legacy struct sockaddr. cannam@132: }; cannam@132: cannam@132: // ======================================================================================= cannam@132: // I/O Provider cannam@132: cannam@132: class AsyncIoProvider { cannam@132: // Class which constructs asynchronous wrappers around the operating system's I/O facilities. cannam@132: // cannam@132: // Generally, the implementation of this interface must integrate closely with a particular cannam@132: // `EventLoop` implementation. Typically, the EventLoop implementation itself will provide cannam@132: // an AsyncIoProvider. cannam@132: cannam@132: public: cannam@132: virtual OneWayPipe newOneWayPipe() = 0; cannam@132: // Creates an input/output stream pair representing the ends of a one-way pipe (e.g. created with cannam@132: // the pipe(2) system call). 
cannam@132: cannam@132: virtual TwoWayPipe newTwoWayPipe() = 0; cannam@132: // Creates two AsyncIoStreams representing the two ends of a two-way pipe (e.g. created with cannam@132: // socketpair(2) system call). Data written to one end can be read from the other. cannam@132: cannam@132: virtual Network& getNetwork() = 0; cannam@132: // Creates a new `Network` instance representing the networks exposed by the operating system. cannam@132: // cannam@132: // DO NOT CALL THIS except at the highest levels of your code, ideally in the main() function. If cannam@132: // you call this from low-level code, then you are preventing higher-level code from injecting an cannam@132: // alternative implementation. Instead, if your code needs to use network functionality, it cannam@132: // should ask for a `Network` as a constructor or method parameter, so that higher-level code can cannam@132: // chose what implementation to use. The system network is essentially a singleton. See: cannam@132: // http://www.object-oriented-security.org/lets-argue/singletons cannam@132: // cannam@132: // Code that uses the system network should not make any assumptions about what kinds of cannam@132: // addresses it will parse, as this could differ across platforms. String addresses should come cannam@132: // strictly from the user, who will know how to write them correctly for their system. cannam@132: // cannam@132: // With that said, KJ currently supports the following string address formats: cannam@132: // - IPv4: "1.2.3.4", "1.2.3.4:80" cannam@132: // - IPv6: "1234:5678::abcd", "[1234:5678::abcd]:80" cannam@132: // - Local IP wildcard (covers both v4 and v6): "*", "*:80" cannam@132: // - Symbolic names: "example.com", "example.com:80", "example.com:http", "1.2.3.4:http" cannam@132: // - Unix domain: "unix:/path/to/socket" cannam@132: cannam@132: struct PipeThread { cannam@132: // A combination of a thread and a two-way pipe that communicates with that thread. 
cannam@132: // cannam@132: // The fields are intentionally ordered so that the pipe will be destroyed (and therefore cannam@132: // disconnected) before the thread is destroyed (and therefore joined). Thus if the thread cannam@132: // arranges to exit when it detects disconnect, destruction should be clean. cannam@132: cannam@132: Own thread; cannam@132: Own pipe; cannam@132: }; cannam@132: cannam@132: virtual PipeThread newPipeThread( cannam@132: Function startFunc) = 0; cannam@132: // Create a new thread and set up a two-way pipe (socketpair) which can be used to communicate cannam@132: // with it. One end of the pipe is passed to the thread's start function and the other end of cannam@132: // the pipe is returned. The new thread also gets its own `AsyncIoProvider` instance and will cannam@132: // already have an active `EventLoop` when `startFunc` is called. cannam@132: // cannam@132: // TODO(someday): I'm not entirely comfortable with this interface. It seems to be doing too cannam@132: // much at once but I'm not sure how to cleanly break it down. cannam@132: cannam@132: virtual Timer& getTimer() = 0; cannam@132: // Returns a `Timer` based on real time. Time does not pass while event handlers are running -- cannam@132: // it only updates when the event loop polls for system events. This means that calling `now()` cannam@132: // on this timer does not require a system call. cannam@132: // cannam@132: // This timer is not affected by changes to the system date. It is unspecified whether the timer cannam@132: // continues to count while the system is suspended. cannam@132: }; cannam@132: cannam@132: class LowLevelAsyncIoProvider { cannam@132: // Similar to `AsyncIoProvider`, but represents a lower-level interface that may differ on cannam@132: // different operating systems. You should prefer to use `AsyncIoProvider` over this interface cannam@132: // whenever possible, as `AsyncIoProvider` is portable and friendlier to dependency-injection. 
cannam@132: // cannam@132: // On Unix, this interface can be used to import native file descriptors into the async framework. cannam@132: // Different implementations of this interface might work on top of different event handling cannam@132: // primitives, such as poll vs. epoll vs. kqueue vs. some higher-level event library. cannam@132: // cannam@132: // On Windows, this interface can be used to import native HANDLEs into the async framework. cannam@132: // Different implementations of this interface might work on top of different event handling cannam@132: // primitives, such as I/O completion ports vs. completion routines. cannam@132: // cannam@132: // TODO(port): Actually implement Windows support. cannam@132: cannam@132: public: cannam@132: // --------------------------------------------------------------------------- cannam@132: // Unix-specific stuff cannam@132: cannam@132: enum Flags { cannam@132: // Flags controlling how to wrap a file descriptor. cannam@132: cannam@132: TAKE_OWNERSHIP = 1 << 0, cannam@132: // The returned object should own the file descriptor, automatically closing it when destroyed. cannam@132: // The close-on-exec flag will be set on the descriptor if it is not already. cannam@132: // cannam@132: // If this flag is not used, then the file descriptor is not automatically closed and the cannam@132: // close-on-exec flag is not modified. cannam@132: cannam@132: ALREADY_CLOEXEC = 1 << 1, cannam@132: // Indicates that the close-on-exec flag is known already to be set, so need not be set again. cannam@132: // Only relevant when combined with TAKE_OWNERSHIP. cannam@132: // cannam@132: // On Linux, all system calls which yield new file descriptors have flags or variants which cannam@132: // set the close-on-exec flag immediately. Unfortunately, other OS's do not. 
cannam@132: cannam@132: ALREADY_NONBLOCK = 1 << 2 cannam@132: // Indicates that the file descriptor is known already to be in non-blocking mode, so the flag cannam@132: // need not be set again. Otherwise, all wrap*Fd() methods will enable non-blocking mode cannam@132: // automatically. cannam@132: // cannam@132: // On Linux, all system calls which yield new file descriptors have flags or variants which cannam@132: // enable non-blocking mode immediately. Unfortunately, other OS's do not. cannam@132: }; cannam@132: cannam@132: virtual Own wrapInputFd(int fd, uint flags = 0) = 0; cannam@132: // Create an AsyncInputStream wrapping a file descriptor. cannam@132: // cannam@132: // `flags` is a bitwise-OR of the values of the `Flags` enum. cannam@132: cannam@132: virtual Own wrapOutputFd(int fd, uint flags = 0) = 0; cannam@132: // Create an AsyncOutputStream wrapping a file descriptor. cannam@132: // cannam@132: // `flags` is a bitwise-OR of the values of the `Flags` enum. cannam@132: cannam@132: virtual Own wrapSocketFd(int fd, uint flags = 0) = 0; cannam@132: // Create an AsyncIoStream wrapping a socket file descriptor. cannam@132: // cannam@132: // `flags` is a bitwise-OR of the values of the `Flags` enum. cannam@132: cannam@132: virtual Promise> wrapConnectingSocketFd(int fd, uint flags = 0) = 0; cannam@132: // Create an AsyncIoStream wrapping a socket that is in the process of connecting. The returned cannam@132: // promise should not resolve until connection has completed -- traditionally indicated by the cannam@132: // descriptor becoming writable. cannam@132: // cannam@132: // `flags` is a bitwise-OR of the values of the `Flags` enum. cannam@132: cannam@132: virtual Own wrapListenSocketFd(int fd, uint flags = 0) = 0; cannam@132: // Create an AsyncIoStream wrapping a listen socket file descriptor. This socket should already cannam@132: // have had `bind()` and `listen()` called on it, so it's ready for `accept()`. 
cannam@132: // cannam@132: // `flags` is a bitwise-OR of the values of the `Flags` enum. cannam@132: cannam@132: virtual Own wrapDatagramSocketFd(int fd, uint flags = 0); cannam@132: cannam@132: virtual Timer& getTimer() = 0; cannam@132: // Returns a `Timer` based on real time. Time does not pass while event handlers are running -- cannam@132: // it only updates when the event loop polls for system events. This means that calling `now()` cannam@132: // on this timer does not require a system call. cannam@132: // cannam@132: // This timer is not affected by changes to the system date. It is unspecified whether the timer cannam@132: // continues to count while the system is suspended. cannam@132: }; cannam@132: cannam@132: Own newAsyncIoProvider(LowLevelAsyncIoProvider& lowLevel); cannam@132: // Make a new AsyncIoProvider wrapping a `LowLevelAsyncIoProvider`. cannam@132: cannam@132: struct AsyncIoContext { cannam@132: Own lowLevelProvider; cannam@132: Own provider; cannam@132: WaitScope& waitScope; cannam@132: cannam@132: UnixEventPort& unixEventPort; cannam@132: // TEMPORARY: Direct access to underlying UnixEventPort, mainly for waiting on signals. This cannam@132: // field will go away at some point when we have a chance to improve these interfaces. cannam@132: }; cannam@132: cannam@132: AsyncIoContext setupAsyncIo(); cannam@132: // Convenience method which sets up the current thread with everything it needs to do async I/O. cannam@132: // The returned objects contain an `EventLoop` which is wrapping an appropriate `EventPort` for cannam@132: // doing I/O on the host system, so everything is ready for the thread to start making async calls cannam@132: // and waiting on promises. cannam@132: // cannam@132: // You would typically call this in your main() loop or in the start function of a thread. 
cannam@132: // Example: cannam@132: // cannam@132: // int main() { cannam@132: // auto ioContext = kj::setupAsyncIo(); cannam@132: // cannam@132: // // Now we can call an async function. cannam@132: // Promise textPromise = getHttp(*ioContext.provider, "http://example.com"); cannam@132: // cannam@132: // // And we can wait for the promise to complete. Note that you can only use `wait()` cannam@132: // // from the top level, not from inside a promise callback. cannam@132: // String text = textPromise.wait(ioContext.waitScope); cannam@132: // print(text); cannam@132: // return 0; cannam@132: // } cannam@132: // cannam@132: // WARNING: An AsyncIoContext can only be used in the thread and process that created it. In cannam@132: // particular, note that after a fork(), an AsyncIoContext created in the parent process will cannam@132: // not work correctly in the child, even if the parent ceases to use its copy. In particular cannam@132: // note that this means that server processes which daemonize themselves at startup must wait cannam@132: // until after daemonization to create an AsyncIoContext. 
cannam@132: cannam@132: // ======================================================================================= cannam@132: // inline implementation details cannam@132: cannam@132: inline AncillaryMessage::AncillaryMessage( cannam@132: int level, int type, ArrayPtr data) cannam@132: : level(level), type(type), data(data) {} cannam@132: cannam@132: inline int AncillaryMessage::getLevel() const { return level; } cannam@132: inline int AncillaryMessage::getType() const { return type; } cannam@132: cannam@132: template cannam@132: inline Maybe AncillaryMessage::as() { cannam@132: if (data.size() >= sizeof(T)) { cannam@132: return *reinterpret_cast(data.begin()); cannam@132: } else { cannam@132: return nullptr; cannam@132: } cannam@132: } cannam@132: cannam@132: template cannam@132: inline ArrayPtr AncillaryMessage::asArray() { cannam@132: return arrayPtr(reinterpret_cast(data.begin()), data.size() / sizeof(T)); cannam@132: } cannam@132: cannam@132: } // namespace kj cannam@132: cannam@132: #endif // KJ_ASYNC_IO_H_