cannam@49: // Copyright (c) 2013-2014 Sandstorm Development Group, Inc. and contributors
cannam@49: // Licensed under the MIT License:
cannam@49: //
cannam@49: // Permission is hereby granted, free of charge, to any person obtaining a copy
cannam@49: // of this software and associated documentation files (the "Software"), to deal
cannam@49: // in the Software without restriction, including without limitation the rights
cannam@49: // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
cannam@49: // copies of the Software, and to permit persons to whom the Software is
cannam@49: // furnished to do so, subject to the following conditions:
cannam@49: //
cannam@49: // The above copyright notice and this permission notice shall be included in
cannam@49: // all copies or substantial portions of the Software.
cannam@49: //
cannam@49: // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
cannam@49: // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
cannam@49: // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
cannam@49: // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
cannam@49: // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
cannam@49: // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
cannam@49: // THE SOFTWARE.
cannam@49: 
cannam@49: #ifndef CAPNP_SCHEMA_PARSER_H_
cannam@49: #define CAPNP_SCHEMA_PARSER_H_
cannam@49: 
cannam@49: #if defined(__GNUC__) && !defined(CAPNP_HEADER_WARNINGS)
cannam@49: #pragma GCC system_header
cannam@49: #endif
cannam@49: 
cannam@49: #include "schema-loader.h"
cannam@49: #include <kj/string.h>
cannam@49: 
cannam@49: namespace capnp {
cannam@49: 
cannam@49: class ParsedSchema;
cannam@49: class SchemaFile;
cannam@49: 
cannam@49: class SchemaParser {
cannam@49:   // Parses `.capnp` files to produce `Schema` objects.
cannam@49:   //
cannam@49:   // This class is thread-safe, hence its parse*() methods are const.
cannam@49: 
cannam@49: public:
cannam@49:   SchemaParser();
cannam@49:   ~SchemaParser() noexcept(false);  // noexcept(false): the destructor is permitted to throw.
cannam@49: 
cannam@49:   ParsedSchema parseDiskFile(kj::StringPtr displayName, kj::StringPtr diskPath,
cannam@49:                              kj::ArrayPtr<const kj::StringPtr> importPath) const;
cannam@49:   // Parse a file located on disk.  Throws an exception if the file doesn't exist.
cannam@49:   //
cannam@49:   // Parameters:
cannam@49:   // * `displayName`:  The name that will appear in the file's schema node.  (If the file has
cannam@49:   //   already been parsed, this will be ignored and the display name from the first time it was
cannam@49:   //   parsed will be kept.)
cannam@49:   // * `diskPath`:  The path to the file on disk.
cannam@49:   // * `importPath`:  Directories to search when resolving absolute imports within this file
cannam@49:   //   (imports that start with a `/`).  Must remain valid until the SchemaParser is destroyed.
cannam@49:   //   (If the file has already been parsed, this will be ignored and the import path from the
cannam@49:   //   first time it was parsed will be kept.)
cannam@49:   //
cannam@49:   // This method is a shortcut, equivalent to:
cannam@49:   //     parser.parseFile(SchemaFile::newDiskFile(displayName, diskPath, importPath));
cannam@49:   //
cannam@49:   // This method throws an exception if any errors are encountered in the file or in anything the
cannam@49:   // file depends on.  Note that merely importing another file does not count as a dependency on
cannam@49:   // anything in the imported file -- only the imported types which are actually used are
cannam@49:   // "dependencies".
cannam@49: 
cannam@49:   ParsedSchema parseFile(kj::Own<SchemaFile>&& file) const;
cannam@49:   // Advanced interface for parsing a file that may or may not be located in any global namespace.
cannam@49:   // Most users will prefer `parseDiskFile()`.
cannam@49:   //
cannam@49:   // If the file has already been parsed (that is, a SchemaFile that compares equal to this one
cannam@49:   // was parsed previously), the existing schema will be returned again.
cannam@49:   //
cannam@49:   // This method reports errors by calling SchemaFile::reportError() on the file where the error
cannam@49:   // is located.  If that call does not throw an exception, `parseFile()` may in fact return
cannam@49:   // normally.  In this case, the result is a best-effort attempt to compile the schema, but it
cannam@49:   // may be invalid or corrupt, and using it for anything may cause exceptions to be thrown.
cannam@49: 
cannam@49:   template <typename T>
cannam@49:   inline void loadCompiledTypeAndDependencies() {
cannam@49:     // Forwards to SchemaLoader::loadCompiledTypeAndDependencies<T>().  Note: non-const.
cannam@49:     getLoader().loadCompiledTypeAndDependencies<T>();
cannam@49:   }
cannam@49: 
cannam@49: private:
cannam@49:   struct Impl;       // Opaque implementation state, owned via `impl`.
cannam@49:   class ModuleImpl;  // Opaque; see getModuleImpl().
cannam@49:   kj::Own<Impl> impl;
cannam@49:   mutable bool hadErrors = false;  // mutable: may be modified from const methods.
cannam@49: 
cannam@49:   ModuleImpl& getModuleImpl(kj::Own<SchemaFile>&& file) const;
cannam@49:   SchemaLoader& getLoader();  // Used by loadCompiledTypeAndDependencies().
cannam@49: 
cannam@49:   friend class ParsedSchema;  // ParsedSchema keeps a pointer back to its SchemaParser.
cannam@49: };
cannam@49: 
cannam@49: class ParsedSchema: public Schema {
cannam@49:   // ParsedSchema is an extension of Schema which also has the ability to look up nested nodes
cannam@49:   // by name.  See `SchemaParser`.
cannam@49: 
cannam@49: public:
cannam@49:   inline ParsedSchema(): parser(nullptr) {}  // Default-constructed: no associated parser.
cannam@49: 
cannam@49:   kj::Maybe<ParsedSchema> findNested(kj::StringPtr name) const;
cannam@49:   // Gets the nested node with the given name, or returns an empty Maybe if there is no such
cannam@49:   // nested declaration.
cannam@49: 
cannam@49:   ParsedSchema getNested(kj::StringPtr name) const;
cannam@49:   // Gets the nested node with the given name, or throws an exception if there is no such nested
cannam@49:   // declaration.
cannam@49: 
cannam@49: private:
cannam@49:   inline ParsedSchema(Schema inner, const SchemaParser& parser): Schema(inner), parser(&parser) {}
cannam@49: 
cannam@49:   const SchemaParser* parser;  // Set by the private constructor; nullptr if default-constructed.
cannam@49:   friend class SchemaParser;   // Grants SchemaParser access to the private constructor.
cannam@49: };
cannam@49: 
cannam@49: // =======================================================================================
cannam@49: // Advanced API
cannam@49: 
cannam@49: class SchemaFile {
cannam@49:   // Abstract interface representing a schema file.  You can implement this yourself in order to
cannam@49:   // gain more control over how the compiler resolves imports and reads files.  For the
cannam@49:   // common case of files on disk or other global filesystem-like namespaces, use
cannam@49:   // `SchemaFile::newDiskFile()`.
cannam@49: 
cannam@49: public:
cannam@49:   class FileReader {  // Filesystem abstraction consumed by newDiskFile().
cannam@49:   public:
cannam@49:     virtual bool exists(kj::StringPtr path) const = 0;  // Presumably: is there a file at `path`?
cannam@49:     virtual kj::Array<const char> read(kj::StringPtr path) const = 0;  // Presumably: its content.
cannam@49:   };
cannam@49: 
cannam@49:   class DiskFileReader final: public FileReader {
cannam@49:     // Implementation of FileReader that uses the local disk.  Files are read using mmap() if
cannam@49:     // possible.
cannam@49: 
cannam@49:   public:
cannam@49:     static const DiskFileReader instance;  // Default `fileReader` argument of newDiskFile().
cannam@49: 
cannam@49:     bool exists(kj::StringPtr path) const override;
cannam@49:     kj::Array<const char> read(kj::StringPtr path) const override;
cannam@49:   };
cannam@49: 
cannam@49:   static kj::Own<SchemaFile> newDiskFile(
cannam@49:       kj::StringPtr displayName, kj::StringPtr diskPath,
cannam@49:       kj::ArrayPtr<const kj::StringPtr> importPath,
cannam@49:       const FileReader& fileReader = DiskFileReader::instance);
cannam@49:   // Construct a SchemaFile representing a file on disk (or located in the filesystem-like
cannam@49:   // namespace represented by `fileReader`).
cannam@49:   //
cannam@49:   // Parameters:
cannam@49:   // * `displayName`:  The name that will appear in the file's schema node.
cannam@49:   // * `diskPath`:  The path to the file on disk.
cannam@49:   // * `importPath`:  Directories to search when resolving absolute imports within this file
cannam@49:   //   (imports that start with a `/`).  The array content must remain valid as long as the
cannam@49:   //   SchemaFile exists (which is at least as long as the SchemaParser that parses it exists).
cannam@49:   // * `fileReader`:  Allows you to use a filesystem other than the actual local disk.  Although,
cannam@49:   //   if you find yourself using this, it may make more sense for you to implement SchemaFile
cannam@49:   //   yourself.
cannam@49:   //
cannam@49:   // The SchemaFile compares equal to any other SchemaFile that has exactly the same disk path,
cannam@49:   // after canonicalization.
cannam@49:   //
cannam@49:   // The SchemaFile will throw an exception if any errors are reported.
cannam@49: 
cannam@49:   // -----------------------------------------------------------------
cannam@49:   // For more control, you can implement this interface.
cannam@49: 
cannam@49:   virtual kj::StringPtr getDisplayName() const = 0;
cannam@49:   // Get the file's name, as it should appear in the schema.
cannam@49: 
cannam@49:   virtual kj::Array<const char> readContent() const = 0;
cannam@49:   // Read the file's entire content and return it as a byte array.
cannam@49: 
cannam@49:   virtual kj::Maybe<kj::Own<SchemaFile>> import(kj::StringPtr path) const = 0;
cannam@49:   // Resolve an import, relative to this file.
cannam@49:   //
cannam@49:   // `path` is exactly what appears between quotes after the `import` keyword in the source code.
cannam@49:   // It is entirely up to the `SchemaFile` to decide how to map this to another file.  Typically,
cannam@49:   // a leading '/' means that the file is an "absolute" path and is searched for in some list of
cannam@49:   // schema file repositories.  On the other hand, a path that doesn't start with '/' is relative
cannam@49:   // to the importing file.
cannam@49: 
cannam@49:   virtual bool operator==(const SchemaFile& other) const = 0;
cannam@49:   virtual bool operator!=(const SchemaFile& other) const = 0;
cannam@49:   virtual size_t hashCode() const = 0;
cannam@49:   // Compare two SchemaFiles to see if they refer to the same underlying file.  This is an
cannam@49:   // optimization used to avoid the need to re-parse a file to check its ID.
cannam@49: 
cannam@49:   struct SourcePos {  // A position in the file; reportError() takes a start/end pair of these.
cannam@49:     uint byte;    // NOTE(review): whether these fields are 0- or 1-based is not stated here.
cannam@49:     uint line;
cannam@49:     uint column;
cannam@49:   };
cannam@49:   virtual void reportError(SourcePos start, SourcePos end, kj::StringPtr message) const = 0;
cannam@49:   // Report that the file contains an error in the interval from `start` to `end`.
cannam@49: 
cannam@49: private:
cannam@49:   class DiskSchemaFile;  // Declared only; presumably the type behind newDiskFile() -- confirm.
cannam@49: };
cannam@49: 
cannam@49: }  // namespace capnp
cannam@49: 
cannam@49: #endif  // CAPNP_SCHEMA_PARSER_H_