annotate json11/json11.cpp @ 75:81e1c48e97f9

Rearrange and rename to Piper C++ structure
author Chris Cannam <c.cannam@qmul.ac.uk>
date Mon, 10 Oct 2016 16:31:09 +0100
parents
children
rev   line source
c@75 1 /* Copyright (c) 2013 Dropbox, Inc.
c@75 2 *
c@75 3 * Permission is hereby granted, free of charge, to any person obtaining a copy
c@75 4 * of this software and associated documentation files (the "Software"), to deal
c@75 5 * in the Software without restriction, including without limitation the rights
c@75 6 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
c@75 7 * copies of the Software, and to permit persons to whom the Software is
c@75 8 * furnished to do so, subject to the following conditions:
c@75 9 *
c@75 10 * The above copyright notice and this permission notice shall be included in
c@75 11 * all copies or substantial portions of the Software.
c@75 12 *
c@75 13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
c@75 14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
c@75 15 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
c@75 16 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
c@75 17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
c@75 18 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
c@75 19 * THE SOFTWARE.
c@75 20 */
c@75 21
c@75 22 #include "json11.hpp"
c@75 23 #include <cassert>
c@75 24 #include <cmath>
c@75 25 #include <cstdlib>
c@75 26 #include <cstdio>
c@75 27 #include <limits>
c@75 28
c@75 29 namespace json11 {
c@75 30
c@75 31 static const int max_depth = 200;
c@75 32
c@75 33 using std::string;
c@75 34 using std::vector;
c@75 35 using std::map;
c@75 36 using std::make_shared;
c@75 37 using std::initializer_list;
c@75 38 using std::move;
c@75 39
c@75 40 /* * * * * * * * * * * * * * * * * * * *
c@75 41 * Serialization
c@75 42 */
c@75 43
c@75 44 static void dump(std::nullptr_t, string &out) {
c@75 45 out += "null";
c@75 46 }
c@75 47
c@75 48 static void dump(double value, string &out) {
c@75 49 if (std::isfinite(value)) {
c@75 50 char buf[32];
c@75 51 snprintf(buf, sizeof buf, "%.17g", value);
c@75 52 out += buf;
c@75 53 } else {
c@75 54 out += "null";
c@75 55 }
c@75 56 }
c@75 57
c@75 58 static void dump(int value, string &out) {
c@75 59 char buf[32];
c@75 60 snprintf(buf, sizeof buf, "%d", value);
c@75 61 out += buf;
c@75 62 }
c@75 63
c@75 64 static void dump(bool value, string &out) {
c@75 65 out += value ? "true" : "false";
c@75 66 }
c@75 67
c@75 68 static void dump(const string &value, string &out) {
c@75 69 out += '"';
c@75 70 for (size_t i = 0; i < value.length(); i++) {
c@75 71 const char ch = value[i];
c@75 72 if (ch == '\\') {
c@75 73 out += "\\\\";
c@75 74 } else if (ch == '"') {
c@75 75 out += "\\\"";
c@75 76 } else if (ch == '\b') {
c@75 77 out += "\\b";
c@75 78 } else if (ch == '\f') {
c@75 79 out += "\\f";
c@75 80 } else if (ch == '\n') {
c@75 81 out += "\\n";
c@75 82 } else if (ch == '\r') {
c@75 83 out += "\\r";
c@75 84 } else if (ch == '\t') {
c@75 85 out += "\\t";
c@75 86 } else if (static_cast<uint8_t>(ch) <= 0x1f) {
c@75 87 char buf[8];
c@75 88 snprintf(buf, sizeof buf, "\\u%04x", ch);
c@75 89 out += buf;
c@75 90 } else if (static_cast<uint8_t>(ch) == 0xe2 && static_cast<uint8_t>(value[i+1]) == 0x80
c@75 91 && static_cast<uint8_t>(value[i+2]) == 0xa8) {
c@75 92 out += "\\u2028";
c@75 93 i += 2;
c@75 94 } else if (static_cast<uint8_t>(ch) == 0xe2 && static_cast<uint8_t>(value[i+1]) == 0x80
c@75 95 && static_cast<uint8_t>(value[i+2]) == 0xa9) {
c@75 96 out += "\\u2029";
c@75 97 i += 2;
c@75 98 } else {
c@75 99 out += ch;
c@75 100 }
c@75 101 }
c@75 102 out += '"';
c@75 103 }
c@75 104
c@75 105 static void dump(const Json::array &values, string &out) {
c@75 106 bool first = true;
c@75 107 out += "[";
c@75 108 for (const auto &value : values) {
c@75 109 if (!first)
c@75 110 out += ", ";
c@75 111 value.dump(out);
c@75 112 first = false;
c@75 113 }
c@75 114 out += "]";
c@75 115 }
c@75 116
c@75 117 static void dump(const Json::object &values, string &out) {
c@75 118 bool first = true;
c@75 119 out += "{";
c@75 120 for (const auto &kv : values) {
c@75 121 if (!first)
c@75 122 out += ", ";
c@75 123 dump(kv.first, out);
c@75 124 out += ": ";
c@75 125 kv.second.dump(out);
c@75 126 first = false;
c@75 127 }
c@75 128 out += "}";
c@75 129 }
c@75 130
c@75 131 void Json::dump(string &out) const {
c@75 132 m_ptr->dump(out);
c@75 133 }
c@75 134
c@75 135 /* * * * * * * * * * * * * * * * * * * *
c@75 136 * Value wrappers
c@75 137 */
c@75 138
c@75 139 template <Json::Type tag, typename T>
c@75 140 class Value : public JsonValue {
c@75 141 protected:
c@75 142
c@75 143 // Constructors
c@75 144 explicit Value(const T &value) : m_value(value) {}
c@75 145 explicit Value(T &&value) : m_value(move(value)) {}
c@75 146
c@75 147 // Get type tag
c@75 148 Json::Type type() const override {
c@75 149 return tag;
c@75 150 }
c@75 151
c@75 152 // Comparisons
c@75 153 bool equals(const JsonValue * other) const override {
c@75 154 return m_value == static_cast<const Value<tag, T> *>(other)->m_value;
c@75 155 }
c@75 156 bool less(const JsonValue * other) const override {
c@75 157 return m_value < static_cast<const Value<tag, T> *>(other)->m_value;
c@75 158 }
c@75 159
c@75 160 const T m_value;
c@75 161 void dump(string &out) const override { json11::dump(m_value, out); }
c@75 162 };
c@75 163
c@75 164 class JsonDouble final : public Value<Json::NUMBER, double> {
c@75 165 double number_value() const override { return m_value; }
c@75 166 int int_value() const override { return static_cast<int>(m_value); }
c@75 167 bool equals(const JsonValue * other) const override { return m_value == other->number_value(); }
c@75 168 bool less(const JsonValue * other) const override { return m_value < other->number_value(); }
c@75 169 public:
c@75 170 explicit JsonDouble(double value) : Value(value) {}
c@75 171 };
c@75 172
c@75 173 class JsonInt final : public Value<Json::NUMBER, int> {
c@75 174 double number_value() const override { return m_value; }
c@75 175 int int_value() const override { return m_value; }
c@75 176 bool equals(const JsonValue * other) const override { return m_value == other->number_value(); }
c@75 177 bool less(const JsonValue * other) const override { return m_value < other->number_value(); }
c@75 178 public:
c@75 179 explicit JsonInt(int value) : Value(value) {}
c@75 180 };
c@75 181
c@75 182 class JsonBoolean final : public Value<Json::BOOL, bool> {
c@75 183 bool bool_value() const override { return m_value; }
c@75 184 public:
c@75 185 explicit JsonBoolean(bool value) : Value(value) {}
c@75 186 };
c@75 187
c@75 188 class JsonString final : public Value<Json::STRING, string> {
c@75 189 const string &string_value() const override { return m_value; }
c@75 190 public:
c@75 191 explicit JsonString(const string &value) : Value(value) {}
c@75 192 explicit JsonString(string &&value) : Value(move(value)) {}
c@75 193 };
c@75 194
c@75 195 class JsonArray final : public Value<Json::ARRAY, Json::array> {
c@75 196 const Json::array &array_items() const override { return m_value; }
c@75 197 const Json & operator[](size_t i) const override;
c@75 198 public:
c@75 199 explicit JsonArray(const Json::array &value) : Value(value) {}
c@75 200 explicit JsonArray(Json::array &&value) : Value(move(value)) {}
c@75 201 };
c@75 202
c@75 203 class JsonObject final : public Value<Json::OBJECT, Json::object> {
c@75 204 const Json::object &object_items() const override { return m_value; }
c@75 205 const Json & operator[](const string &key) const override;
c@75 206 public:
c@75 207 explicit JsonObject(const Json::object &value) : Value(value) {}
c@75 208 explicit JsonObject(Json::object &&value) : Value(move(value)) {}
c@75 209 };
c@75 210
c@75 211 class JsonNull final : public Value<Json::NUL, std::nullptr_t> {
c@75 212 public:
c@75 213 JsonNull() : Value(nullptr) {}
c@75 214 };
c@75 215
c@75 216 /* * * * * * * * * * * * * * * * * * * *
c@75 217 * Static globals - static-init-safe
c@75 218 */
c@75 219 struct Statics {
c@75 220 const std::shared_ptr<JsonValue> null = make_shared<JsonNull>();
c@75 221 const std::shared_ptr<JsonValue> t = make_shared<JsonBoolean>(true);
c@75 222 const std::shared_ptr<JsonValue> f = make_shared<JsonBoolean>(false);
c@75 223 const string empty_string;
c@75 224 const vector<Json> empty_vector;
c@75 225 const map<string, Json> empty_map;
c@75 226 Statics() {}
c@75 227 };
c@75 228
c@75 229 static const Statics & statics() {
c@75 230 static const Statics s {};
c@75 231 return s;
c@75 232 }
c@75 233
c@75 234 static const Json & static_null() {
c@75 235 // This has to be separate, not in Statics, because Json() accesses statics().null.
c@75 236 static const Json json_null;
c@75 237 return json_null;
c@75 238 }
c@75 239
c@75 240 /* * * * * * * * * * * * * * * * * * * *
c@75 241 * Constructors
c@75 242 */
c@75 243
c@75 244 Json::Json() noexcept : m_ptr(statics().null) {}
c@75 245 Json::Json(std::nullptr_t) noexcept : m_ptr(statics().null) {}
c@75 246 Json::Json(double value) : m_ptr(make_shared<JsonDouble>(value)) {}
c@75 247 Json::Json(int value) : m_ptr(make_shared<JsonInt>(value)) {}
c@75 248 Json::Json(bool value) : m_ptr(value ? statics().t : statics().f) {}
c@75 249 Json::Json(const string &value) : m_ptr(make_shared<JsonString>(value)) {}
c@75 250 Json::Json(string &&value) : m_ptr(make_shared<JsonString>(move(value))) {}
c@75 251 Json::Json(const char * value) : m_ptr(make_shared<JsonString>(value)) {}
c@75 252 Json::Json(const Json::array &values) : m_ptr(make_shared<JsonArray>(values)) {}
c@75 253 Json::Json(Json::array &&values) : m_ptr(make_shared<JsonArray>(move(values))) {}
c@75 254 Json::Json(const Json::object &values) : m_ptr(make_shared<JsonObject>(values)) {}
c@75 255 Json::Json(Json::object &&values) : m_ptr(make_shared<JsonObject>(move(values))) {}
c@75 256
c@75 257 /* * * * * * * * * * * * * * * * * * * *
c@75 258 * Accessors
c@75 259 */
c@75 260
c@75 261 Json::Type Json::type() const { return m_ptr->type(); }
c@75 262 double Json::number_value() const { return m_ptr->number_value(); }
c@75 263 int Json::int_value() const { return m_ptr->int_value(); }
c@75 264 bool Json::bool_value() const { return m_ptr->bool_value(); }
c@75 265 const string & Json::string_value() const { return m_ptr->string_value(); }
c@75 266 const vector<Json> & Json::array_items() const { return m_ptr->array_items(); }
c@75 267 const map<string, Json> & Json::object_items() const { return m_ptr->object_items(); }
c@75 268 const Json & Json::operator[] (size_t i) const { return (*m_ptr)[i]; }
c@75 269 const Json & Json::operator[] (const string &key) const { return (*m_ptr)[key]; }
c@75 270
c@75 271 double JsonValue::number_value() const { return 0; }
c@75 272 int JsonValue::int_value() const { return 0; }
c@75 273 bool JsonValue::bool_value() const { return false; }
c@75 274 const string & JsonValue::string_value() const { return statics().empty_string; }
c@75 275 const vector<Json> & JsonValue::array_items() const { return statics().empty_vector; }
c@75 276 const map<string, Json> & JsonValue::object_items() const { return statics().empty_map; }
c@75 277 const Json & JsonValue::operator[] (size_t) const { return static_null(); }
c@75 278 const Json & JsonValue::operator[] (const string &) const { return static_null(); }
c@75 279
c@75 280 const Json & JsonObject::operator[] (const string &key) const {
c@75 281 auto iter = m_value.find(key);
c@75 282 return (iter == m_value.end()) ? static_null() : iter->second;
c@75 283 }
c@75 284 const Json & JsonArray::operator[] (size_t i) const {
c@75 285 if (i >= m_value.size()) return static_null();
c@75 286 else return m_value[i];
c@75 287 }
c@75 288
c@75 289 /* * * * * * * * * * * * * * * * * * * *
c@75 290 * Comparison
c@75 291 */
c@75 292
c@75 293 bool Json::operator== (const Json &other) const {
c@75 294 if (m_ptr->type() != other.m_ptr->type())
c@75 295 return false;
c@75 296
c@75 297 return m_ptr->equals(other.m_ptr.get());
c@75 298 }
c@75 299
c@75 300 bool Json::operator< (const Json &other) const {
c@75 301 if (m_ptr->type() != other.m_ptr->type())
c@75 302 return m_ptr->type() < other.m_ptr->type();
c@75 303
c@75 304 return m_ptr->less(other.m_ptr.get());
c@75 305 }
c@75 306
c@75 307 /* * * * * * * * * * * * * * * * * * * *
c@75 308 * Parsing
c@75 309 */
c@75 310
c@75 311 /* esc(c)
c@75 312 *
c@75 313 * Format char c suitable for printing in an error message.
c@75 314 */
c@75 315 static inline string esc(char c) {
c@75 316 char buf[12];
c@75 317 if (static_cast<uint8_t>(c) >= 0x20 && static_cast<uint8_t>(c) <= 0x7f) {
c@75 318 snprintf(buf, sizeof buf, "'%c' (%d)", c, c);
c@75 319 } else {
c@75 320 snprintf(buf, sizeof buf, "(%d)", c);
c@75 321 }
c@75 322 return string(buf);
c@75 323 }
c@75 324
c@75 325 static inline bool in_range(long x, long lower, long upper) {
c@75 326 return (x >= lower && x <= upper);
c@75 327 }
c@75 328
c@75 329 /* JsonParser
c@75 330 *
c@75 331 * Object that tracks all state of an in-progress parse.
c@75 332 */
c@75 333 struct JsonParser {
c@75 334
c@75 335 /* State
c@75 336 */
c@75 337 const string &str;
c@75 338 size_t i;
c@75 339 string &err;
c@75 340 bool failed;
c@75 341 const JsonParse strategy;
c@75 342
c@75 343 /* fail(msg, err_ret = Json())
c@75 344 *
c@75 345 * Mark this parse as failed.
c@75 346 */
c@75 347 Json fail(string &&msg) {
c@75 348 return fail(move(msg), Json());
c@75 349 }
c@75 350
c@75 351 template <typename T>
c@75 352 T fail(string &&msg, const T err_ret) {
c@75 353 if (!failed)
c@75 354 err = std::move(msg);
c@75 355 failed = true;
c@75 356 return err_ret;
c@75 357 }
c@75 358
c@75 359 /* consume_whitespace()
c@75 360 *
c@75 361 * Advance until the current character is non-whitespace.
c@75 362 */
c@75 363 void consume_whitespace() {
c@75 364 while (str[i] == ' ' || str[i] == '\r' || str[i] == '\n' || str[i] == '\t')
c@75 365 i++;
c@75 366 }
c@75 367
c@75 368 /* consume_comment()
c@75 369 *
c@75 370 * Advance comments (c-style inline and multiline).
c@75 371 */
c@75 372 bool consume_comment() {
c@75 373 bool comment_found = false;
c@75 374 if (str[i] == '/') {
c@75 375 i++;
c@75 376 if (i == str.size())
c@75 377 return fail("unexpected end of input inside comment", 0);
c@75 378 if (str[i] == '/') { // inline comment
c@75 379 i++;
c@75 380 if (i == str.size())
c@75 381 return fail("unexpected end of input inside inline comment", 0);
c@75 382 // advance until next line
c@75 383 while (str[i] != '\n') {
c@75 384 i++;
c@75 385 if (i == str.size())
c@75 386 return fail("unexpected end of input inside inline comment", 0);
c@75 387 }
c@75 388 comment_found = true;
c@75 389 }
c@75 390 else if (str[i] == '*') { // multiline comment
c@75 391 i++;
c@75 392 if (i > str.size()-2)
c@75 393 return fail("unexpected end of input inside multi-line comment", 0);
c@75 394 // advance until closing tokens
c@75 395 while (!(str[i] == '*' && str[i+1] == '/')) {
c@75 396 i++;
c@75 397 if (i > str.size()-2)
c@75 398 return fail(
c@75 399 "unexpected end of input inside multi-line comment", 0);
c@75 400 }
c@75 401 i += 2;
c@75 402 if (i == str.size())
c@75 403 return fail(
c@75 404 "unexpected end of input inside multi-line comment", 0);
c@75 405 comment_found = true;
c@75 406 }
c@75 407 else
c@75 408 return fail("malformed comment", 0);
c@75 409 }
c@75 410 return comment_found;
c@75 411 }
c@75 412
c@75 413 /* consume_garbage()
c@75 414 *
c@75 415 * Advance until the current character is non-whitespace and non-comment.
c@75 416 */
c@75 417 void consume_garbage() {
c@75 418 consume_whitespace();
c@75 419 if(strategy == JsonParse::COMMENTS) {
c@75 420 bool comment_found = false;
c@75 421 do {
c@75 422 comment_found = consume_comment();
c@75 423 consume_whitespace();
c@75 424 }
c@75 425 while(comment_found);
c@75 426 }
c@75 427 }
c@75 428
c@75 429 /* get_next_token()
c@75 430 *
c@75 431 * Return the next non-whitespace character. If the end of the input is reached,
c@75 432 * flag an error and return 0.
c@75 433 */
c@75 434 char get_next_token() {
c@75 435 consume_garbage();
c@75 436 if (i == str.size())
c@75 437 return fail("unexpected end of input", 0);
c@75 438
c@75 439 return str[i++];
c@75 440 }
c@75 441
c@75 442 /* encode_utf8(pt, out)
c@75 443 *
c@75 444 * Encode pt as UTF-8 and add it to out.
c@75 445 */
c@75 446 void encode_utf8(long pt, string & out) {
c@75 447 if (pt < 0)
c@75 448 return;
c@75 449
c@75 450 if (pt < 0x80) {
c@75 451 out += static_cast<char>(pt);
c@75 452 } else if (pt < 0x800) {
c@75 453 out += static_cast<char>((pt >> 6) | 0xC0);
c@75 454 out += static_cast<char>((pt & 0x3F) | 0x80);
c@75 455 } else if (pt < 0x10000) {
c@75 456 out += static_cast<char>((pt >> 12) | 0xE0);
c@75 457 out += static_cast<char>(((pt >> 6) & 0x3F) | 0x80);
c@75 458 out += static_cast<char>((pt & 0x3F) | 0x80);
c@75 459 } else {
c@75 460 out += static_cast<char>((pt >> 18) | 0xF0);
c@75 461 out += static_cast<char>(((pt >> 12) & 0x3F) | 0x80);
c@75 462 out += static_cast<char>(((pt >> 6) & 0x3F) | 0x80);
c@75 463 out += static_cast<char>((pt & 0x3F) | 0x80);
c@75 464 }
c@75 465 }
c@75 466
c@75 467 /* parse_string()
c@75 468 *
c@75 469 * Parse a string, starting at the current position.
c@75 470 */
c@75 471 string parse_string() {
c@75 472 string out;
c@75 473 long last_escaped_codepoint = -1;
c@75 474 while (true) {
c@75 475 if (i == str.size())
c@75 476 return fail("unexpected end of input in string", "");
c@75 477
c@75 478 char ch = str[i++];
c@75 479
c@75 480 if (ch == '"') {
c@75 481 encode_utf8(last_escaped_codepoint, out);
c@75 482 return out;
c@75 483 }
c@75 484
c@75 485 if (in_range(ch, 0, 0x1f))
c@75 486 return fail("unescaped " + esc(ch) + " in string", "");
c@75 487
c@75 488 // The usual case: non-escaped characters
c@75 489 if (ch != '\\') {
c@75 490 encode_utf8(last_escaped_codepoint, out);
c@75 491 last_escaped_codepoint = -1;
c@75 492 out += ch;
c@75 493 continue;
c@75 494 }
c@75 495
c@75 496 // Handle escapes
c@75 497 if (i == str.size())
c@75 498 return fail("unexpected end of input in string", "");
c@75 499
c@75 500 ch = str[i++];
c@75 501
c@75 502 if (ch == 'u') {
c@75 503 // Extract 4-byte escape sequence
c@75 504 string esc = str.substr(i, 4);
c@75 505 // Explicitly check length of the substring. The following loop
c@75 506 // relies on std::string returning the terminating NUL when
c@75 507 // accessing str[length]. Checking here reduces brittleness.
c@75 508 if (esc.length() < 4) {
c@75 509 return fail("bad \\u escape: " + esc, "");
c@75 510 }
c@75 511 for (int j = 0; j < 4; j++) {
c@75 512 if (!in_range(esc[j], 'a', 'f') && !in_range(esc[j], 'A', 'F')
c@75 513 && !in_range(esc[j], '0', '9'))
c@75 514 return fail("bad \\u escape: " + esc, "");
c@75 515 }
c@75 516
c@75 517 long codepoint = strtol(esc.data(), nullptr, 16);
c@75 518
c@75 519 // JSON specifies that characters outside the BMP shall be encoded as a pair
c@75 520 // of 4-hex-digit \u escapes encoding their surrogate pair components. Check
c@75 521 // whether we're in the middle of such a beast: the previous codepoint was an
c@75 522 // escaped lead (high) surrogate, and this is a trail (low) surrogate.
c@75 523 if (in_range(last_escaped_codepoint, 0xD800, 0xDBFF)
c@75 524 && in_range(codepoint, 0xDC00, 0xDFFF)) {
c@75 525 // Reassemble the two surrogate pairs into one astral-plane character, per
c@75 526 // the UTF-16 algorithm.
c@75 527 encode_utf8((((last_escaped_codepoint - 0xD800) << 10)
c@75 528 | (codepoint - 0xDC00)) + 0x10000, out);
c@75 529 last_escaped_codepoint = -1;
c@75 530 } else {
c@75 531 encode_utf8(last_escaped_codepoint, out);
c@75 532 last_escaped_codepoint = codepoint;
c@75 533 }
c@75 534
c@75 535 i += 4;
c@75 536 continue;
c@75 537 }
c@75 538
c@75 539 encode_utf8(last_escaped_codepoint, out);
c@75 540 last_escaped_codepoint = -1;
c@75 541
c@75 542 if (ch == 'b') {
c@75 543 out += '\b';
c@75 544 } else if (ch == 'f') {
c@75 545 out += '\f';
c@75 546 } else if (ch == 'n') {
c@75 547 out += '\n';
c@75 548 } else if (ch == 'r') {
c@75 549 out += '\r';
c@75 550 } else if (ch == 't') {
c@75 551 out += '\t';
c@75 552 } else if (ch == '"' || ch == '\\' || ch == '/') {
c@75 553 out += ch;
c@75 554 } else {
c@75 555 return fail("invalid escape character " + esc(ch), "");
c@75 556 }
c@75 557 }
c@75 558 }
c@75 559
c@75 560 /* parse_number()
c@75 561 *
c@75 562 * Parse a double.
c@75 563 */
c@75 564 Json parse_number() {
c@75 565 size_t start_pos = i;
c@75 566
c@75 567 if (str[i] == '-')
c@75 568 i++;
c@75 569
c@75 570 // Integer part
c@75 571 if (str[i] == '0') {
c@75 572 i++;
c@75 573 if (in_range(str[i], '0', '9'))
c@75 574 return fail("leading 0s not permitted in numbers");
c@75 575 } else if (in_range(str[i], '1', '9')) {
c@75 576 i++;
c@75 577 while (in_range(str[i], '0', '9'))
c@75 578 i++;
c@75 579 } else {
c@75 580 return fail("invalid " + esc(str[i]) + " in number");
c@75 581 }
c@75 582
c@75 583 if (str[i] != '.' && str[i] != 'e' && str[i] != 'E'
c@75 584 && (i - start_pos) <= static_cast<size_t>(std::numeric_limits<int>::digits10)) {
c@75 585 return std::atoi(str.c_str() + start_pos);
c@75 586 }
c@75 587
c@75 588 // Decimal part
c@75 589 if (str[i] == '.') {
c@75 590 i++;
c@75 591 if (!in_range(str[i], '0', '9'))
c@75 592 return fail("at least one digit required in fractional part");
c@75 593
c@75 594 while (in_range(str[i], '0', '9'))
c@75 595 i++;
c@75 596 }
c@75 597
c@75 598 // Exponent part
c@75 599 if (str[i] == 'e' || str[i] == 'E') {
c@75 600 i++;
c@75 601
c@75 602 if (str[i] == '+' || str[i] == '-')
c@75 603 i++;
c@75 604
c@75 605 if (!in_range(str[i], '0', '9'))
c@75 606 return fail("at least one digit required in exponent");
c@75 607
c@75 608 while (in_range(str[i], '0', '9'))
c@75 609 i++;
c@75 610 }
c@75 611
c@75 612 return std::strtod(str.c_str() + start_pos, nullptr);
c@75 613 }
c@75 614
c@75 615 /* expect(str, res)
c@75 616 *
c@75 617 * Expect that 'str' starts at the character that was just read. If it does, advance
c@75 618 * the input and return res. If not, flag an error.
c@75 619 */
c@75 620 Json expect(const string &expected, Json res) {
c@75 621 assert(i != 0);
c@75 622 i--;
c@75 623 if (str.compare(i, expected.length(), expected) == 0) {
c@75 624 i += expected.length();
c@75 625 return res;
c@75 626 } else {
c@75 627 return fail("parse error: expected " + expected + ", got " + str.substr(i, expected.length()));
c@75 628 }
c@75 629 }
c@75 630
c@75 631 /* parse_json()
c@75 632 *
c@75 633 * Parse a JSON object.
c@75 634 */
c@75 635 Json parse_json(int depth) {
c@75 636 if (depth > max_depth) {
c@75 637 return fail("exceeded maximum nesting depth");
c@75 638 }
c@75 639
c@75 640 char ch = get_next_token();
c@75 641 if (failed)
c@75 642 return Json();
c@75 643
c@75 644 if (ch == '-' || (ch >= '0' && ch <= '9')) {
c@75 645 i--;
c@75 646 return parse_number();
c@75 647 }
c@75 648
c@75 649 if (ch == 't')
c@75 650 return expect("true", true);
c@75 651
c@75 652 if (ch == 'f')
c@75 653 return expect("false", false);
c@75 654
c@75 655 if (ch == 'n')
c@75 656 return expect("null", Json());
c@75 657
c@75 658 if (ch == '"')
c@75 659 return parse_string();
c@75 660
c@75 661 if (ch == '{') {
c@75 662 map<string, Json> data;
c@75 663 ch = get_next_token();
c@75 664 if (ch == '}')
c@75 665 return data;
c@75 666
c@75 667 while (1) {
c@75 668 if (ch != '"')
c@75 669 return fail("expected '\"' in object, got " + esc(ch));
c@75 670
c@75 671 string key = parse_string();
c@75 672 if (failed)
c@75 673 return Json();
c@75 674
c@75 675 ch = get_next_token();
c@75 676 if (ch != ':')
c@75 677 return fail("expected ':' in object, got " + esc(ch));
c@75 678
c@75 679 data[std::move(key)] = parse_json(depth + 1);
c@75 680 if (failed)
c@75 681 return Json();
c@75 682
c@75 683 ch = get_next_token();
c@75 684 if (ch == '}')
c@75 685 break;
c@75 686 if (ch != ',')
c@75 687 return fail("expected ',' in object, got " + esc(ch));
c@75 688
c@75 689 ch = get_next_token();
c@75 690 }
c@75 691 return data;
c@75 692 }
c@75 693
c@75 694 if (ch == '[') {
c@75 695 vector<Json> data;
c@75 696 ch = get_next_token();
c@75 697 if (ch == ']')
c@75 698 return data;
c@75 699
c@75 700 while (1) {
c@75 701 i--;
c@75 702 data.push_back(parse_json(depth + 1));
c@75 703 if (failed)
c@75 704 return Json();
c@75 705
c@75 706 ch = get_next_token();
c@75 707 if (ch == ']')
c@75 708 break;
c@75 709 if (ch != ',')
c@75 710 return fail("expected ',' in list, got " + esc(ch));
c@75 711
c@75 712 ch = get_next_token();
c@75 713 (void)ch;
c@75 714 }
c@75 715 return data;
c@75 716 }
c@75 717
c@75 718 return fail("expected value, got " + esc(ch));
c@75 719 }
c@75 720 };
c@75 721
c@75 722 Json Json::parse(const string &in, string &err, JsonParse strategy) {
c@75 723 JsonParser parser { in, 0, err, false, strategy };
c@75 724 Json result = parser.parse_json(0);
c@75 725
c@75 726 // Check for any trailing garbage
c@75 727 parser.consume_garbage();
c@75 728 if (parser.i != in.size())
c@75 729 return parser.fail("unexpected trailing " + esc(in[parser.i]));
c@75 730
c@75 731 return result;
c@75 732 }
c@75 733
c@75 734 // Documented in json11.hpp
c@75 735 vector<Json> Json::parse_multi(const string &in,
c@75 736 string &err,
c@75 737 JsonParse strategy) {
c@75 738 JsonParser parser { in, 0, err, false, strategy };
c@75 739
c@75 740 vector<Json> json_vec;
c@75 741 while (parser.i != in.size() && !parser.failed) {
c@75 742 json_vec.push_back(parser.parse_json(0));
c@75 743 // Check for another object
c@75 744 parser.consume_garbage();
c@75 745 }
c@75 746 return json_vec;
c@75 747 }
c@75 748
c@75 749 /* * * * * * * * * * * * * * * * * * * *
c@75 750 * Shape-checking
c@75 751 */
c@75 752
c@75 753 bool Json::has_shape(const shape & types, string & err) const {
c@75 754 if (!is_object()) {
c@75 755 err = "expected JSON object, got " + dump();
c@75 756 return false;
c@75 757 }
c@75 758
c@75 759 for (auto & item : types) {
c@75 760 if ((*this)[item.first].type() != item.second) {
c@75 761 err = "bad type for " + item.first + " in " + dump();
c@75 762 return false;
c@75 763 }
c@75 764 }
c@75 765
c@75 766 return true;
c@75 767 }
c@75 768
c@75 769 } // namespace json11