123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788 |
- /* Copyright (c) 2013 Dropbox, Inc.
- *
- * Permission is hereby granted, free of charge, to any person obtaining a copy
- * of this software and associated documentation files (the "Software"), to deal
- * in the Software without restriction, including without limitation the rights
- * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
- * copies of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
- * THE SOFTWARE.
- */
- #include "json11.hpp"
- #include <cassert>
- #include <cmath>
- #include <cstdlib>
- #include <cstdio>
- #include <limits>
- namespace json11 {
- static const int max_depth = 200;
- using std::string;
- using std::vector;
- using std::map;
- using std::make_shared;
- using std::initializer_list;
- using std::move;
- /* Helper for representing null - just a do-nothing struct, plus comparison
- * operators so the helpers in JsonValue work. We can't use nullptr_t because
- * it may not be orderable.
- */
- struct NullStruct {
- bool operator==(NullStruct) const { return true; }
- bool operator<(NullStruct) const { return false; }
- };
- /* * * * * * * * * * * * * * * * * * * *
- * Serialization
- */
- static void dump(NullStruct, string &out) {
- out += "null";
- }
- static void dump(double value, string &out) {
- if (std::isfinite(value)) {
- char buf[32];
- snprintf(buf, sizeof buf, "%.17g", value);
- out += buf;
- } else {
- out += "null";
- }
- }
- static void dump(int value, string &out) {
- char buf[32];
- snprintf(buf, sizeof buf, "%d", value);
- out += buf;
- }
- static void dump(bool value, string &out) {
- out += value ? "true" : "false";
- }
- static void dump(const string &value, string &out) {
- out += '"';
- for (size_t i = 0; i < value.length(); i++) {
- const char ch = value[i];
- if (ch == '\\') {
- out += "\\\\";
- } else if (ch == '"') {
- out += "\\\"";
- } else if (ch == '\b') {
- out += "\\b";
- } else if (ch == '\f') {
- out += "\\f";
- } else if (ch == '\n') {
- out += "\\n";
- } else if (ch == '\r') {
- out += "\\r";
- } else if (ch == '\t') {
- out += "\\t";
- } else if (static_cast<uint8_t>(ch) <= 0x1f) {
- char buf[8];
- snprintf(buf, sizeof buf, "\\u%04x", ch);
- out += buf;
- } else if (static_cast<uint8_t>(ch) == 0xe2 && static_cast<uint8_t>(value[i+1]) == 0x80
- && static_cast<uint8_t>(value[i+2]) == 0xa8) {
- out += "\\u2028";
- i += 2;
- } else if (static_cast<uint8_t>(ch) == 0xe2 && static_cast<uint8_t>(value[i+1]) == 0x80
- && static_cast<uint8_t>(value[i+2]) == 0xa9) {
- out += "\\u2029";
- i += 2;
- } else {
- out += ch;
- }
- }
- out += '"';
- }
- static void dump(const Json::array &values, string &out) {
- bool first = true;
- out += "[";
- for (const auto &value : values) {
- if (!first)
- out += ",";
- value.dump(out);
- first = false;
- }
- out += "]";
- }
- static void dump(const Json::object &values, string &out) {
- bool first = true;
- out += "{";
- for (const auto &kv : values) {
- if (!first)
- out += ",";
- dump(kv.first, out);
- out += ":";
- kv.second.dump(out);
- first = false;
- }
- out += "}";
- }
- void Json::dump(string &out) const {
- m_ptr->dump(out);
- }
- /* * * * * * * * * * * * * * * * * * * *
- * Value wrappers
- */
- template <Json::Type tag, typename T>
- class Value : public JsonValue {
- protected:
- // Constructors
- explicit Value(const T &value) : m_value(value) {}
- explicit Value(T &&value) : m_value(move(value)) {}
- // Get type tag
- Json::Type type() const override {
- return tag;
- }
- // Comparisons
- bool equals(const JsonValue * other) const override {
- return m_value == static_cast<const Value<tag, T> *>(other)->m_value;
- }
- bool less(const JsonValue * other) const override {
- return m_value < static_cast<const Value<tag, T> *>(other)->m_value;
- }
- const T m_value;
- void dump(string &out) const override { json11::dump(m_value, out); }
- };
- class JsonDouble final : public Value<Json::NUMBER, double> {
- double number_value() const override { return m_value; }
- int int_value() const override { return static_cast<int>(m_value); }
- bool equals(const JsonValue * other) const override { return m_value == other->number_value(); }
- bool less(const JsonValue * other) const override { return m_value < other->number_value(); }
- public:
- explicit JsonDouble(double value) : Value(value) {}
- };
- class JsonInt final : public Value<Json::NUMBER, int> {
- double number_value() const override { return m_value; }
- int int_value() const override { return m_value; }
- bool equals(const JsonValue * other) const override { return m_value == other->number_value(); }
- bool less(const JsonValue * other) const override { return m_value < other->number_value(); }
- public:
- explicit JsonInt(int value) : Value(value) {}
- };
- class JsonBoolean final : public Value<Json::BOOL, bool> {
- bool bool_value() const override { return m_value; }
- public:
- explicit JsonBoolean(bool value) : Value(value) {}
- };
- class JsonString final : public Value<Json::STRING, string> {
- const string &string_value() const override { return m_value; }
- public:
- explicit JsonString(const string &value) : Value(value) {}
- explicit JsonString(string &&value) : Value(move(value)) {}
- };
- class JsonArray final : public Value<Json::ARRAY, Json::array> {
- const Json::array &array_items() const override { return m_value; }
- const Json & operator[](size_t i) const override;
- public:
- explicit JsonArray(const Json::array &value) : Value(value) {}
- explicit JsonArray(Json::array &&value) : Value(move(value)) {}
- };
- class JsonObject final : public Value<Json::OBJECT, Json::object> {
- const Json::object &object_items() const override { return m_value; }
- const Json & operator[](const string &key) const override;
- public:
- explicit JsonObject(const Json::object &value) : Value(value) {}
- explicit JsonObject(Json::object &&value) : Value(move(value)) {}
- };
- class JsonNull final : public Value<Json::NUL, NullStruct> {
- public:
- JsonNull() : Value({}) {}
- };
- /* * * * * * * * * * * * * * * * * * * *
- * Static globals - static-init-safe
- */
- struct Statics {
- const std::shared_ptr<JsonValue> null = make_shared<JsonNull>();
- const std::shared_ptr<JsonValue> t = make_shared<JsonBoolean>(true);
- const std::shared_ptr<JsonValue> f = make_shared<JsonBoolean>(false);
- const string empty_string;
- const vector<Json> empty_vector;
- const map<string, Json> empty_map;
- Statics() {}
- };
- static const Statics & statics() {
- static const Statics s {};
- return s;
- }
- static const Json & static_null() {
- // This has to be separate, not in Statics, because Json() accesses statics().null.
- static const Json json_null;
- return json_null;
- }
- /* * * * * * * * * * * * * * * * * * * *
- * Constructors
- */
- Json::Json() noexcept : m_ptr(statics().null) {}
- Json::Json(std::nullptr_t) noexcept : m_ptr(statics().null) {}
- Json::Json(double value) : m_ptr(make_shared<JsonDouble>(value)) {}
- Json::Json(int value) : m_ptr(make_shared<JsonInt>(value)) {}
- Json::Json(bool value) : m_ptr(value ? statics().t : statics().f) {}
- Json::Json(const string &value) : m_ptr(make_shared<JsonString>(value)) {}
- Json::Json(string &&value) : m_ptr(make_shared<JsonString>(move(value))) {}
- Json::Json(const char * value) : m_ptr(make_shared<JsonString>(value)) {}
- Json::Json(const Json::array &values) : m_ptr(make_shared<JsonArray>(values)) {}
- Json::Json(Json::array &&values) : m_ptr(make_shared<JsonArray>(move(values))) {}
- Json::Json(const Json::object &values) : m_ptr(make_shared<JsonObject>(values)) {}
- Json::Json(Json::object &&values) : m_ptr(make_shared<JsonObject>(move(values))) {}
- /* * * * * * * * * * * * * * * * * * * *
- * Accessors
- */
- Json::Type Json::type() const { return m_ptr->type(); }
- double Json::number_value() const { return m_ptr->number_value(); }
- int Json::int_value() const { return m_ptr->int_value(); }
- bool Json::bool_value() const { return m_ptr->bool_value(); }
- const string & Json::string_value() const { return m_ptr->string_value(); }
- const vector<Json> & Json::array_items() const { return m_ptr->array_items(); }
- const map<string, Json> & Json::object_items() const { return m_ptr->object_items(); }
- const Json & Json::operator[] (size_t i) const { return (*m_ptr)[i]; }
- const Json & Json::operator[] (const string &key) const { return (*m_ptr)[key]; }
- double JsonValue::number_value() const { return 0; }
- int JsonValue::int_value() const { return 0; }
- bool JsonValue::bool_value() const { return false; }
- const string & JsonValue::string_value() const { return statics().empty_string; }
- const vector<Json> & JsonValue::array_items() const { return statics().empty_vector; }
- const map<string, Json> & JsonValue::object_items() const { return statics().empty_map; }
- const Json & JsonValue::operator[] (size_t) const { return static_null(); }
- const Json & JsonValue::operator[] (const string &) const { return static_null(); }
- const Json & JsonObject::operator[] (const string &key) const {
- auto iter = m_value.find(key);
- return (iter == m_value.end()) ? static_null() : iter->second;
- }
- const Json & JsonArray::operator[] (size_t i) const {
- if (i >= m_value.size()) return static_null();
- else return m_value[i];
- }
- /* * * * * * * * * * * * * * * * * * * *
- * Comparison
- */
- bool Json::operator== (const Json &other) const {
- if (m_ptr == other.m_ptr)
- return true;
- if (m_ptr->type() != other.m_ptr->type())
- return false;
- return m_ptr->equals(other.m_ptr.get());
- }
- bool Json::operator< (const Json &other) const {
- if (m_ptr == other.m_ptr)
- return false;
- if (m_ptr->type() != other.m_ptr->type())
- return m_ptr->type() < other.m_ptr->type();
- return m_ptr->less(other.m_ptr.get());
- }
- /* * * * * * * * * * * * * * * * * * * *
- * Parsing
- */
- /* esc(c)
- *
- * Format char c suitable for printing in an error message.
- */
- static inline string esc(char c) {
- char buf[12];
- if (static_cast<uint8_t>(c) >= 0x20 && static_cast<uint8_t>(c) <= 0x7f) {
- snprintf(buf, sizeof buf, "'%c' (%d)", c, c);
- } else {
- snprintf(buf, sizeof buf, "(%d)", c);
- }
- return string(buf);
- }
- static inline bool in_range(long x, long lower, long upper) {
- return (x >= lower && x <= upper);
- }
- namespace {
- /* JsonParser
- *
- * Object that tracks all state of an in-progress parse.
- */
- struct JsonParser final {
- /* State
- */
- const string &str;
- size_t i;
- string &err;
- bool failed;
- const JsonParse strategy;
- /* fail(msg, err_ret = Json())
- *
- * Mark this parse as failed.
- */
- Json fail(string &&msg) {
- return fail(move(msg), Json());
- }
- template <typename T>
- T fail(string &&msg, const T err_ret) {
- if (!failed)
- err = std::move(msg);
- failed = true;
- return err_ret;
- }
- /* consume_whitespace()
- *
- * Advance until the current character is non-whitespace.
- */
- void consume_whitespace() {
- while (str[i] == ' ' || str[i] == '\r' || str[i] == '\n' || str[i] == '\t')
- i++;
- }
- /* consume_comment()
- *
- * Advance comments (c-style inline and multiline).
- */
- bool consume_comment() {
- bool comment_found = false;
- if (str[i] == '/') {
- i++;
- if (i == str.size())
- return fail("unexpected end of input after start of comment", false);
- if (str[i] == '/') { // inline comment
- i++;
- // advance until next line, or end of input
- while (i < str.size() && str[i] != '\n') {
- i++;
- }
- comment_found = true;
- }
- else if (str[i] == '*') { // multiline comment
- i++;
- if (i > str.size()-2)
- return fail("unexpected end of input inside multi-line comment", false);
- // advance until closing tokens
- while (!(str[i] == '*' && str[i+1] == '/')) {
- i++;
- if (i > str.size()-2)
- return fail(
- "unexpected end of input inside multi-line comment", false);
- }
- i += 2;
- comment_found = true;
- }
- else
- return fail("malformed comment", false);
- }
- return comment_found;
- }
- /* consume_garbage()
- *
- * Advance until the current character is non-whitespace and non-comment.
- */
- void consume_garbage() {
- consume_whitespace();
- if(strategy == JsonParse::COMMENTS) {
- bool comment_found = false;
- do {
- comment_found = consume_comment();
- if (failed) return;
- consume_whitespace();
- }
- while(comment_found);
- }
- }
- /* get_next_token()
- *
- * Return the next non-whitespace character. If the end of the input is reached,
- * flag an error and return 0.
- */
- char get_next_token() {
- consume_garbage();
- if (failed) return (char)0;
- if (i == str.size())
- return fail("unexpected end of input", (char)0);
- return str[i++];
- }
- /* encode_utf8(pt, out)
- *
- * Encode pt as UTF-8 and add it to out.
- */
- void encode_utf8(long pt, string & out) {
- if (pt < 0)
- return;
- if (pt < 0x80) {
- out += static_cast<char>(pt);
- } else if (pt < 0x800) {
- out += static_cast<char>((pt >> 6) | 0xC0);
- out += static_cast<char>((pt & 0x3F) | 0x80);
- } else if (pt < 0x10000) {
- out += static_cast<char>((pt >> 12) | 0xE0);
- out += static_cast<char>(((pt >> 6) & 0x3F) | 0x80);
- out += static_cast<char>((pt & 0x3F) | 0x80);
- } else {
- out += static_cast<char>((pt >> 18) | 0xF0);
- out += static_cast<char>(((pt >> 12) & 0x3F) | 0x80);
- out += static_cast<char>(((pt >> 6) & 0x3F) | 0x80);
- out += static_cast<char>((pt & 0x3F) | 0x80);
- }
- }
- /* parse_string()
- *
- * Parse a string, starting at the current position.
- */
- string parse_string() {
- string out;
- long last_escaped_codepoint = -1;
- while (true) {
- if (i == str.size())
- return fail("unexpected end of input in string", "");
- char ch = str[i++];
- if (ch == '"') {
- encode_utf8(last_escaped_codepoint, out);
- return out;
- }
- if (in_range(ch, 0, 0x1f))
- return fail("unescaped " + esc(ch) + " in string", "");
- // The usual case: non-escaped characters
- if (ch != '\\') {
- encode_utf8(last_escaped_codepoint, out);
- last_escaped_codepoint = -1;
- out += ch;
- continue;
- }
- // Handle escapes
- if (i == str.size())
- return fail("unexpected end of input in string", "");
- ch = str[i++];
- if (ch == 'u') {
- // Extract 4-byte escape sequence
- string esc = str.substr(i, 4);
- // Explicitly check length of the substring. The following loop
- // relies on std::string returning the terminating NUL when
- // accessing str[length]. Checking here reduces brittleness.
- if (esc.length() < 4) {
- return fail("bad \\u escape: " + esc, "");
- }
- for (size_t j = 0; j < 4; j++) {
- if (!in_range(esc[j], 'a', 'f') && !in_range(esc[j], 'A', 'F')
- && !in_range(esc[j], '0', '9'))
- return fail("bad \\u escape: " + esc, "");
- }
- long codepoint = strtol(esc.data(), nullptr, 16);
- // JSON specifies that characters outside the BMP shall be encoded as a pair
- // of 4-hex-digit \u escapes encoding their surrogate pair components. Check
- // whether we're in the middle of such a beast: the previous codepoint was an
- // escaped lead (high) surrogate, and this is a trail (low) surrogate.
- if (in_range(last_escaped_codepoint, 0xD800, 0xDBFF)
- && in_range(codepoint, 0xDC00, 0xDFFF)) {
- // Reassemble the two surrogate pairs into one astral-plane character, per
- // the UTF-16 algorithm.
- encode_utf8((((last_escaped_codepoint - 0xD800) << 10)
- | (codepoint - 0xDC00)) + 0x10000, out);
- last_escaped_codepoint = -1;
- } else {
- encode_utf8(last_escaped_codepoint, out);
- last_escaped_codepoint = codepoint;
- }
- i += 4;
- continue;
- }
- encode_utf8(last_escaped_codepoint, out);
- last_escaped_codepoint = -1;
- if (ch == 'b') {
- out += '\b';
- } else if (ch == 'f') {
- out += '\f';
- } else if (ch == 'n') {
- out += '\n';
- } else if (ch == 'r') {
- out += '\r';
- } else if (ch == 't') {
- out += '\t';
- } else if (ch == '"' || ch == '\\' || ch == '/') {
- out += ch;
- } else {
- return fail("invalid escape character " + esc(ch), "");
- }
- }
- }
- /* parse_number()
- *
- * Parse a double.
- */
- Json parse_number() {
- size_t start_pos = i;
- if (str[i] == '-')
- i++;
- // Integer part
- if (str[i] == '0') {
- i++;
- if (in_range(str[i], '0', '9'))
- return fail("leading 0s not permitted in numbers");
- } else if (in_range(str[i], '1', '9')) {
- i++;
- while (in_range(str[i], '0', '9'))
- i++;
- } else {
- return fail("invalid " + esc(str[i]) + " in number");
- }
- if (str[i] != '.' && str[i] != 'e' && str[i] != 'E'
- && (i - start_pos) <= static_cast<size_t>(std::numeric_limits<int>::digits10)) {
- return std::atoi(str.c_str() + start_pos);
- }
- // Decimal part
- if (str[i] == '.') {
- i++;
- if (!in_range(str[i], '0', '9'))
- return fail("at least one digit required in fractional part");
- while (in_range(str[i], '0', '9'))
- i++;
- }
- // Exponent part
- if (str[i] == 'e' || str[i] == 'E') {
- i++;
- if (str[i] == '+' || str[i] == '-')
- i++;
- if (!in_range(str[i], '0', '9'))
- return fail("at least one digit required in exponent");
- while (in_range(str[i], '0', '9'))
- i++;
- }
- return std::strtod(str.c_str() + start_pos, nullptr);
- }
- /* expect(str, res)
- *
- * Expect that 'str' starts at the character that was just read. If it does, advance
- * the input and return res. If not, flag an error.
- */
- Json expect(const string &expected, Json res) {
- assert(i != 0);
- i--;
- if (str.compare(i, expected.length(), expected) == 0) {
- i += expected.length();
- return res;
- } else {
- return fail("parse error: expected " + expected + ", got " + str.substr(i, expected.length()));
- }
- }
- /* parse_json()
- *
- * Parse a JSON object.
- */
- Json parse_json(int depth) {
- if (depth > max_depth) {
- return fail("exceeded maximum nesting depth");
- }
- char ch = get_next_token();
- if (failed)
- return Json();
- if (ch == '-' || (ch >= '0' && ch <= '9')) {
- i--;
- return parse_number();
- }
- if (ch == 't')
- return expect("true", true);
- if (ch == 'f')
- return expect("false", false);
- if (ch == 'n')
- return expect("null", Json());
- if (ch == '"')
- return parse_string();
- if (ch == '{') {
- map<string, Json> data;
- ch = get_next_token();
- if (ch == '}')
- return data;
- while (1) {
- if (ch != '"')
- return fail("expected '\"' in object, got " + esc(ch));
- string key = parse_string();
- if (failed)
- return Json();
- ch = get_next_token();
- if (ch != ':')
- return fail("expected ':' in object, got " + esc(ch));
- data[std::move(key)] = parse_json(depth + 1);
- if (failed)
- return Json();
- ch = get_next_token();
- if (ch == '}')
- break;
- if (ch != ',')
- return fail("expected ',' in object, got " + esc(ch));
- ch = get_next_token();
- }
- return data;
- }
- if (ch == '[') {
- vector<Json> data;
- ch = get_next_token();
- if (ch == ']')
- return data;
- while (1) {
- i--;
- data.push_back(parse_json(depth + 1));
- if (failed)
- return Json();
- ch = get_next_token();
- if (ch == ']')
- break;
- if (ch != ',')
- return fail("expected ',' in list, got " + esc(ch));
- ch = get_next_token();
- (void)ch;
- }
- return data;
- }
- return fail("expected value, got " + esc(ch));
- }
- };
- }//namespace {
- Json Json::parse(const string &in, string &err, JsonParse strategy) {
- JsonParser parser { in, 0, err, false, strategy };
- Json result = parser.parse_json(0);
- // Check for any trailing garbage
- parser.consume_garbage();
- if (parser.failed)
- return Json();
- if (parser.i != in.size())
- return parser.fail("unexpected trailing " + esc(in[parser.i]));
- return result;
- }
- // Documented in json11.hpp
- vector<Json> Json::parse_multi(const string &in,
- std::string::size_type &parser_stop_pos,
- string &err,
- JsonParse strategy) {
- JsonParser parser { in, 0, err, false, strategy };
- parser_stop_pos = 0;
- vector<Json> json_vec;
- while (parser.i != in.size() && !parser.failed) {
- json_vec.push_back(parser.parse_json(0));
- if (parser.failed)
- break;
- // Check for another object
- parser.consume_garbage();
- if (parser.failed)
- break;
- parser_stop_pos = parser.i;
- }
- return json_vec;
- }
- /* * * * * * * * * * * * * * * * * * * *
- * Shape-checking
- */
- bool Json::has_shape(const shape & types, string & err) const {
- if (!is_object()) {
- err = "expected JSON object, got " + dump();
- return false;
- }
- for (auto & item : types) {
- if ((*this)[item.first].type() != item.second) {
- err = "bad type for " + item.first + " in " + dump();
- return false;
- }
- }
- return true;
- }
- } // namespace json11
|