123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004 |
- // Copyright 2007-2011 Baptiste Lepilleur and The JsonCpp Authors
- // Copyright (C) 2016 InfoTeCS JSC. All rights reserved.
- // Distributed under MIT license, or public domain if desired and
- // recognized in your jurisdiction.
- // See file LICENSE for detail or copy at http://jsoncpp.sourceforge.net/LICENSE
- #if !defined(JSON_IS_AMALGAMATION)
- #include "json_tool.h"
- #include <json/assertions.h>
- #include <json/reader.h>
- #include <json/value.h>
- #endif // if !defined(JSON_IS_AMALGAMATION)
- #include <algorithm>
- #include <cassert>
- #include <cmath>
- #include <cstring>
- #include <iostream>
- #include <istream>
- #include <limits>
- #include <memory>
- #include <set>
- #include <sstream>
- #include <utility>
- #include <cstdio>
- #if __cplusplus >= 201103L
- #if !defined(sscanf)
- #define sscanf std::sscanf
- #endif
- #endif //__cplusplus
- #if defined(_MSC_VER)
- #if !defined(_CRT_SECURE_CPP_OVERLOAD_STANDARD_NAMES)
- #define _CRT_SECURE_CPP_OVERLOAD_STANDARD_NAMES 1
- #endif //_CRT_SECURE_CPP_OVERLOAD_STANDARD_NAMES
- #endif //_MSC_VER
- #if defined(_MSC_VER)
- // Disable warning about strdup being deprecated.
- #pragma warning(disable : 4996)
- #endif
- // Define JSONCPP_DEPRECATED_STACK_LIMIT as an appropriate integer at compile
- // time to change the stack limit
- #if !defined(JSONCPP_DEPRECATED_STACK_LIMIT)
- #define JSONCPP_DEPRECATED_STACK_LIMIT 1000
- #endif
- static size_t const stackLimit_g =
- JSONCPP_DEPRECATED_STACK_LIMIT; // see readValue()
- namespace Json {
- #if __cplusplus >= 201103L || (defined(_CPPLIB_VER) && _CPPLIB_VER >= 520)
- using CharReaderPtr = std::unique_ptr<CharReader>;
- #else
- using CharReaderPtr = std::auto_ptr<CharReader>;
- #endif
- // Implementation of class Features
- // ////////////////////////////////
- Features::Features() = default;
- Features Features::all() { return {}; }
- Features Features::strictMode() {
- Features features;
- features.allowComments_ = false;
- features.strictRoot_ = true;
- features.allowDroppedNullPlaceholders_ = false;
- features.allowNumericKeys_ = false;
- return features;
- }
- // Implementation of class Reader
- // ////////////////////////////////
- bool Reader::containsNewLine(Reader::Location begin, Reader::Location end) {
- return std::any_of(begin, end, [](char b) { return b == '\n' || b == '\r'; });
- }
- // Class Reader
- // //////////////////////////////////////////////////////////////////
- Reader::Reader() : features_(Features::all()) {}
- Reader::Reader(const Features& features) : features_(features) {}
- bool Reader::parse(const std::string& document, Value& root,
- bool collectComments) {
- document_.assign(document.begin(), document.end());
- const char* begin = document_.c_str();
- const char* end = begin + document_.length();
- return parse(begin, end, root, collectComments);
- }
- bool Reader::parse(std::istream& is, Value& root, bool collectComments) {
- // std::istream_iterator<char> begin(is);
- // std::istream_iterator<char> end;
- // Those would allow streamed input from a file, if parse() were a
- // template function.
- // Since String is reference-counted, this at least does not
- // create an extra copy.
- String doc(std::istreambuf_iterator<char>(is), {});
- return parse(doc.data(), doc.data() + doc.size(), root, collectComments);
- }
- bool Reader::parse(const char* beginDoc, const char* endDoc, Value& root,
- bool collectComments) {
- if (!features_.allowComments_) {
- collectComments = false;
- }
- begin_ = beginDoc;
- end_ = endDoc;
- collectComments_ = collectComments;
- current_ = begin_;
- lastValueEnd_ = nullptr;
- lastValue_ = nullptr;
- commentsBefore_.clear();
- errors_.clear();
- while (!nodes_.empty())
- nodes_.pop();
- nodes_.push(&root);
- bool successful = readValue();
- Token token;
- skipCommentTokens(token);
- if (collectComments_ && !commentsBefore_.empty())
- root.setComment(commentsBefore_, commentAfter);
- if (features_.strictRoot_) {
- if (!root.isArray() && !root.isObject()) {
- // Set error location to start of doc, ideally should be first token found
- // in doc
- token.type_ = tokenError;
- token.start_ = beginDoc;
- token.end_ = endDoc;
- addError(
- "A valid JSON document must be either an array or an object value.",
- token);
- return false;
- }
- }
- return successful;
- }
- bool Reader::readValue() {
- // readValue() may call itself only if it calls readObject() or ReadArray().
- // These methods execute nodes_.push() just before and nodes_.pop)() just
- // after calling readValue(). parse() executes one nodes_.push(), so > instead
- // of >=.
- if (nodes_.size() > stackLimit_g)
- throwRuntimeError("Exceeded stackLimit in readValue().");
- Token token;
- skipCommentTokens(token);
- bool successful = true;
- if (collectComments_ && !commentsBefore_.empty()) {
- currentValue().setComment(commentsBefore_, commentBefore);
- commentsBefore_.clear();
- }
- switch (token.type_) {
- case tokenObjectBegin:
- successful = readObject(token);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- case tokenArrayBegin:
- successful = readArray(token);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- case tokenNumber:
- successful = decodeNumber(token);
- break;
- case tokenString:
- successful = decodeString(token);
- break;
- case tokenTrue: {
- Value v(true);
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenFalse: {
- Value v(false);
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenNull: {
- Value v;
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenArraySeparator:
- case tokenObjectEnd:
- case tokenArrayEnd:
- if (features_.allowDroppedNullPlaceholders_) {
- // "Un-read" the current token and mark the current value as a null
- // token.
- current_--;
- Value v;
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(current_ - begin_ - 1);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- } // Else, fall through...
- default:
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return addError("Syntax error: value, object or array expected.", token);
- }
- if (collectComments_) {
- lastValueEnd_ = current_;
- lastValue_ = ¤tValue();
- }
- return successful;
- }
- void Reader::skipCommentTokens(Token& token) {
- if (features_.allowComments_) {
- do {
- readToken(token);
- } while (token.type_ == tokenComment);
- } else {
- readToken(token);
- }
- }
- bool Reader::readToken(Token& token) {
- skipSpaces();
- token.start_ = current_;
- Char c = getNextChar();
- bool ok = true;
- switch (c) {
- case '{':
- token.type_ = tokenObjectBegin;
- break;
- case '}':
- token.type_ = tokenObjectEnd;
- break;
- case '[':
- token.type_ = tokenArrayBegin;
- break;
- case ']':
- token.type_ = tokenArrayEnd;
- break;
- case '"':
- token.type_ = tokenString;
- ok = readString();
- break;
- case '/':
- token.type_ = tokenComment;
- ok = readComment();
- break;
- case '0':
- case '1':
- case '2':
- case '3':
- case '4':
- case '5':
- case '6':
- case '7':
- case '8':
- case '9':
- case '-':
- token.type_ = tokenNumber;
- readNumber();
- break;
- case 't':
- token.type_ = tokenTrue;
- ok = match("rue", 3);
- break;
- case 'f':
- token.type_ = tokenFalse;
- ok = match("alse", 4);
- break;
- case 'n':
- token.type_ = tokenNull;
- ok = match("ull", 3);
- break;
- case ',':
- token.type_ = tokenArraySeparator;
- break;
- case ':':
- token.type_ = tokenMemberSeparator;
- break;
- case 0:
- token.type_ = tokenEndOfStream;
- break;
- default:
- ok = false;
- break;
- }
- if (!ok)
- token.type_ = tokenError;
- token.end_ = current_;
- return ok;
- }
- void Reader::skipSpaces() {
- while (current_ != end_) {
- Char c = *current_;
- if (c == ' ' || c == '\t' || c == '\r' || c == '\n')
- ++current_;
- else
- break;
- }
- }
- bool Reader::match(const Char* pattern, int patternLength) {
- if (end_ - current_ < patternLength)
- return false;
- int index = patternLength;
- while (index--)
- if (current_[index] != pattern[index])
- return false;
- current_ += patternLength;
- return true;
- }
- bool Reader::readComment() {
- Location commentBegin = current_ - 1;
- Char c = getNextChar();
- bool successful = false;
- if (c == '*')
- successful = readCStyleComment();
- else if (c == '/')
- successful = readCppStyleComment();
- if (!successful)
- return false;
- if (collectComments_) {
- CommentPlacement placement = commentBefore;
- if (lastValueEnd_ && !containsNewLine(lastValueEnd_, commentBegin)) {
- if (c != '*' || !containsNewLine(commentBegin, current_))
- placement = commentAfterOnSameLine;
- }
- addComment(commentBegin, current_, placement);
- }
- return true;
- }
- String Reader::normalizeEOL(Reader::Location begin, Reader::Location end) {
- String normalized;
- normalized.reserve(static_cast<size_t>(end - begin));
- Reader::Location current = begin;
- while (current != end) {
- char c = *current++;
- if (c == '\r') {
- if (current != end && *current == '\n')
- // convert dos EOL
- ++current;
- // convert Mac EOL
- normalized += '\n';
- } else {
- normalized += c;
- }
- }
- return normalized;
- }
- void Reader::addComment(Location begin, Location end,
- CommentPlacement placement) {
- assert(collectComments_);
- const String& normalized = normalizeEOL(begin, end);
- if (placement == commentAfterOnSameLine) {
- assert(lastValue_ != nullptr);
- lastValue_->setComment(normalized, placement);
- } else {
- commentsBefore_ += normalized;
- }
- }
- bool Reader::readCStyleComment() {
- while ((current_ + 1) < end_) {
- Char c = getNextChar();
- if (c == '*' && *current_ == '/')
- break;
- }
- return getNextChar() == '/';
- }
- bool Reader::readCppStyleComment() {
- while (current_ != end_) {
- Char c = getNextChar();
- if (c == '\n')
- break;
- if (c == '\r') {
- // Consume DOS EOL. It will be normalized in addComment.
- if (current_ != end_ && *current_ == '\n')
- getNextChar();
- // Break on Moc OS 9 EOL.
- break;
- }
- }
- return true;
- }
- void Reader::readNumber() {
- Location p = current_;
- char c = '0'; // stopgap for already consumed character
- // integral part
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- // fractional part
- if (c == '.') {
- c = (current_ = p) < end_ ? *p++ : '\0';
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- }
- // exponential part
- if (c == 'e' || c == 'E') {
- c = (current_ = p) < end_ ? *p++ : '\0';
- if (c == '+' || c == '-')
- c = (current_ = p) < end_ ? *p++ : '\0';
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- }
- }
- bool Reader::readString() {
- Char c = '\0';
- while (current_ != end_) {
- c = getNextChar();
- if (c == '\\')
- getNextChar();
- else if (c == '"')
- break;
- }
- return c == '"';
- }
- bool Reader::readObject(Token& token) {
- Token tokenName;
- String name;
- Value init(objectValue);
- currentValue().swapPayload(init);
- currentValue().setOffsetStart(token.start_ - begin_);
- while (readToken(tokenName)) {
- bool initialTokenOk = true;
- while (tokenName.type_ == tokenComment && initialTokenOk)
- initialTokenOk = readToken(tokenName);
- if (!initialTokenOk)
- break;
- if (tokenName.type_ == tokenObjectEnd && name.empty()) // empty object
- return true;
- name.clear();
- if (tokenName.type_ == tokenString) {
- if (!decodeString(tokenName, name))
- return recoverFromError(tokenObjectEnd);
- } else if (tokenName.type_ == tokenNumber && features_.allowNumericKeys_) {
- Value numberName;
- if (!decodeNumber(tokenName, numberName))
- return recoverFromError(tokenObjectEnd);
- name = numberName.asString();
- } else {
- break;
- }
- Token colon;
- if (!readToken(colon) || colon.type_ != tokenMemberSeparator) {
- return addErrorAndRecover("Missing ':' after object member name", colon,
- tokenObjectEnd);
- }
- Value& value = currentValue()[name];
- nodes_.push(&value);
- bool ok = readValue();
- nodes_.pop();
- if (!ok) // error already set
- return recoverFromError(tokenObjectEnd);
- Token comma;
- if (!readToken(comma) ||
- (comma.type_ != tokenObjectEnd && comma.type_ != tokenArraySeparator &&
- comma.type_ != tokenComment)) {
- return addErrorAndRecover("Missing ',' or '}' in object declaration",
- comma, tokenObjectEnd);
- }
- bool finalizeTokenOk = true;
- while (comma.type_ == tokenComment && finalizeTokenOk)
- finalizeTokenOk = readToken(comma);
- if (comma.type_ == tokenObjectEnd)
- return true;
- }
- return addErrorAndRecover("Missing '}' or object member name", tokenName,
- tokenObjectEnd);
- }
- bool Reader::readArray(Token& token) {
- Value init(arrayValue);
- currentValue().swapPayload(init);
- currentValue().setOffsetStart(token.start_ - begin_);
- skipSpaces();
- if (current_ != end_ && *current_ == ']') // empty array
- {
- Token endArray;
- readToken(endArray);
- return true;
- }
- int index = 0;
- for (;;) {
- Value& value = currentValue()[index++];
- nodes_.push(&value);
- bool ok = readValue();
- nodes_.pop();
- if (!ok) // error already set
- return recoverFromError(tokenArrayEnd);
- Token currentToken;
- // Accept Comment after last item in the array.
- ok = readToken(currentToken);
- while (currentToken.type_ == tokenComment && ok) {
- ok = readToken(currentToken);
- }
- bool badTokenType = (currentToken.type_ != tokenArraySeparator &&
- currentToken.type_ != tokenArrayEnd);
- if (!ok || badTokenType) {
- return addErrorAndRecover("Missing ',' or ']' in array declaration",
- currentToken, tokenArrayEnd);
- }
- if (currentToken.type_ == tokenArrayEnd)
- break;
- }
- return true;
- }
- bool Reader::decodeNumber(Token& token) {
- Value decoded;
- if (!decodeNumber(token, decoded))
- return false;
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool Reader::decodeNumber(Token& token, Value& decoded) {
- // Attempts to parse the number as an integer. If the number is
- // larger than the maximum supported value of an integer then
- // we decode the number as a double.
- Location current = token.start_;
- bool isNegative = *current == '-';
- if (isNegative)
- ++current;
- // TODO: Help the compiler do the div and mod at compile time or get rid of
- // them.
- Value::LargestUInt maxIntegerValue =
- isNegative ? Value::LargestUInt(Value::maxLargestInt) + 1
- : Value::maxLargestUInt;
- Value::LargestUInt threshold = maxIntegerValue / 10;
- Value::LargestUInt value = 0;
- while (current < token.end_) {
- Char c = *current++;
- if (c < '0' || c > '9')
- return decodeDouble(token, decoded);
- auto digit(static_cast<Value::UInt>(c - '0'));
- if (value >= threshold) {
- // We've hit or exceeded the max value divided by 10 (rounded down). If
- // a) we've only just touched the limit, b) this is the last digit, and
- // c) it's small enough to fit in that rounding delta, we're okay.
- // Otherwise treat this number as a double to avoid overflow.
- if (value > threshold || current != token.end_ ||
- digit > maxIntegerValue % 10) {
- return decodeDouble(token, decoded);
- }
- }
- value = value * 10 + digit;
- }
- if (isNegative && value == maxIntegerValue)
- decoded = Value::minLargestInt;
- else if (isNegative)
- decoded = -Value::LargestInt(value);
- else if (value <= Value::LargestUInt(Value::maxInt))
- decoded = Value::LargestInt(value);
- else
- decoded = value;
- return true;
- }
- bool Reader::decodeDouble(Token& token) {
- Value decoded;
- if (!decodeDouble(token, decoded))
- return false;
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool Reader::decodeDouble(Token& token, Value& decoded) {
- double value = 0;
- String buffer(token.start_, token.end_);
- IStringStream is(buffer);
- if (!(is >> value)) {
- if (value == std::numeric_limits<double>::max())
- value = std::numeric_limits<double>::infinity();
- else if (value == std::numeric_limits<double>::lowest())
- value = -std::numeric_limits<double>::infinity();
- else if (!std::isinf(value))
- return addError(
- "'" + String(token.start_, token.end_) + "' is not a number.", token);
- }
- decoded = value;
- return true;
- }
- bool Reader::decodeString(Token& token) {
- String decoded_string;
- if (!decodeString(token, decoded_string))
- return false;
- Value decoded(decoded_string);
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool Reader::decodeString(Token& token, String& decoded) {
- decoded.reserve(static_cast<size_t>(token.end_ - token.start_ - 2));
- Location current = token.start_ + 1; // skip '"'
- Location end = token.end_ - 1; // do not include '"'
- while (current != end) {
- Char c = *current++;
- if (c == '"')
- break;
- if (c == '\\') {
- if (current == end)
- return addError("Empty escape sequence in string", token, current);
- Char escape = *current++;
- switch (escape) {
- case '"':
- decoded += '"';
- break;
- case '/':
- decoded += '/';
- break;
- case '\\':
- decoded += '\\';
- break;
- case 'b':
- decoded += '\b';
- break;
- case 'f':
- decoded += '\f';
- break;
- case 'n':
- decoded += '\n';
- break;
- case 'r':
- decoded += '\r';
- break;
- case 't':
- decoded += '\t';
- break;
- case 'u': {
- unsigned int unicode;
- if (!decodeUnicodeCodePoint(token, current, end, unicode))
- return false;
- decoded += codePointToUTF8(unicode);
- } break;
- default:
- return addError("Bad escape sequence in string", token, current);
- }
- } else {
- decoded += c;
- }
- }
- return true;
- }
- bool Reader::decodeUnicodeCodePoint(Token& token, Location& current,
- Location end, unsigned int& unicode) {
- if (!decodeUnicodeEscapeSequence(token, current, end, unicode))
- return false;
- if (unicode >= 0xD800 && unicode <= 0xDBFF) {
- // surrogate pairs
- if (end - current < 6)
- return addError(
- "additional six characters expected to parse unicode surrogate pair.",
- token, current);
- if (*(current++) == '\\' && *(current++) == 'u') {
- unsigned int surrogatePair;
- if (decodeUnicodeEscapeSequence(token, current, end, surrogatePair)) {
- unicode = 0x10000 + ((unicode & 0x3FF) << 10) + (surrogatePair & 0x3FF);
- } else
- return false;
- } else
- return addError("expecting another \\u token to begin the second half of "
- "a unicode surrogate pair",
- token, current);
- }
- return true;
- }
- bool Reader::decodeUnicodeEscapeSequence(Token& token, Location& current,
- Location end,
- unsigned int& ret_unicode) {
- if (end - current < 4)
- return addError(
- "Bad unicode escape sequence in string: four digits expected.", token,
- current);
- int unicode = 0;
- for (int index = 0; index < 4; ++index) {
- Char c = *current++;
- unicode *= 16;
- if (c >= '0' && c <= '9')
- unicode += c - '0';
- else if (c >= 'a' && c <= 'f')
- unicode += c - 'a' + 10;
- else if (c >= 'A' && c <= 'F')
- unicode += c - 'A' + 10;
- else
- return addError(
- "Bad unicode escape sequence in string: hexadecimal digit expected.",
- token, current);
- }
- ret_unicode = static_cast<unsigned int>(unicode);
- return true;
- }
- bool Reader::addError(const String& message, Token& token, Location extra) {
- ErrorInfo info;
- info.token_ = token;
- info.message_ = message;
- info.extra_ = extra;
- errors_.push_back(info);
- return false;
- }
- bool Reader::recoverFromError(TokenType skipUntilToken) {
- size_t const errorCount = errors_.size();
- Token skip;
- for (;;) {
- if (!readToken(skip))
- errors_.resize(errorCount); // discard errors caused by recovery
- if (skip.type_ == skipUntilToken || skip.type_ == tokenEndOfStream)
- break;
- }
- errors_.resize(errorCount);
- return false;
- }
- bool Reader::addErrorAndRecover(const String& message, Token& token,
- TokenType skipUntilToken) {
- addError(message, token);
- return recoverFromError(skipUntilToken);
- }
- Value& Reader::currentValue() { return *(nodes_.top()); }
- Reader::Char Reader::getNextChar() {
- if (current_ == end_)
- return 0;
- return *current_++;
- }
- void Reader::getLocationLineAndColumn(Location location, int& line,
- int& column) const {
- Location current = begin_;
- Location lastLineStart = current;
- line = 0;
- while (current < location && current != end_) {
- Char c = *current++;
- if (c == '\r') {
- if (*current == '\n')
- ++current;
- lastLineStart = current;
- ++line;
- } else if (c == '\n') {
- lastLineStart = current;
- ++line;
- }
- }
- // column & line start at 1
- column = int(location - lastLineStart) + 1;
- ++line;
- }
- String Reader::getLocationLineAndColumn(Location location) const {
- int line, column;
- getLocationLineAndColumn(location, line, column);
- char buffer[18 + 16 + 16 + 1];
- jsoncpp_snprintf(buffer, sizeof(buffer), "Line %d, Column %d", line, column);
- return buffer;
- }
- // Deprecated. Preserved for backward compatibility
- String Reader::getFormatedErrorMessages() const {
- return getFormattedErrorMessages();
- }
- String Reader::getFormattedErrorMessages() const {
- String formattedMessage;
- for (const auto& error : errors_) {
- formattedMessage +=
- "* " + getLocationLineAndColumn(error.token_.start_) + "\n";
- formattedMessage += " " + error.message_ + "\n";
- if (error.extra_)
- formattedMessage +=
- "See " + getLocationLineAndColumn(error.extra_) + " for detail.\n";
- }
- return formattedMessage;
- }
- std::vector<Reader::StructuredError> Reader::getStructuredErrors() const {
- std::vector<Reader::StructuredError> allErrors;
- for (const auto& error : errors_) {
- Reader::StructuredError structured;
- structured.offset_start = error.token_.start_ - begin_;
- structured.offset_limit = error.token_.end_ - begin_;
- structured.message = error.message_;
- allErrors.push_back(structured);
- }
- return allErrors;
- }
- bool Reader::pushError(const Value& value, const String& message) {
- ptrdiff_t const length = end_ - begin_;
- if (value.getOffsetStart() > length || value.getOffsetLimit() > length)
- return false;
- Token token;
- token.type_ = tokenError;
- token.start_ = begin_ + value.getOffsetStart();
- token.end_ = begin_ + value.getOffsetLimit();
- ErrorInfo info;
- info.token_ = token;
- info.message_ = message;
- info.extra_ = nullptr;
- errors_.push_back(info);
- return true;
- }
- bool Reader::pushError(const Value& value, const String& message,
- const Value& extra) {
- ptrdiff_t const length = end_ - begin_;
- if (value.getOffsetStart() > length || value.getOffsetLimit() > length ||
- extra.getOffsetLimit() > length)
- return false;
- Token token;
- token.type_ = tokenError;
- token.start_ = begin_ + value.getOffsetStart();
- token.end_ = begin_ + value.getOffsetLimit();
- ErrorInfo info;
- info.token_ = token;
- info.message_ = message;
- info.extra_ = begin_ + extra.getOffsetStart();
- errors_.push_back(info);
- return true;
- }
- bool Reader::good() const { return errors_.empty(); }
- // Originally copied from the Features class (now deprecated), used internally
- // for features implementation.
- class OurFeatures {
- public:
- static OurFeatures all();
- bool allowComments_;
- bool allowTrailingCommas_;
- bool strictRoot_;
- bool allowDroppedNullPlaceholders_;
- bool allowNumericKeys_;
- bool allowSingleQuotes_;
- bool failIfExtra_;
- bool rejectDupKeys_;
- bool allowSpecialFloats_;
- bool skipBom_;
- size_t stackLimit_;
- }; // OurFeatures
- OurFeatures OurFeatures::all() { return {}; }
- // Implementation of class Reader
- // ////////////////////////////////
- // Originally copied from the Reader class (now deprecated), used internally
- // for implementing JSON reading.
- class OurReader {
- public:
- using Char = char;
- using Location = const Char*;
- struct StructuredError {
- ptrdiff_t offset_start;
- ptrdiff_t offset_limit;
- String message;
- };
- explicit OurReader(OurFeatures const& features);
- bool parse(const char* beginDoc, const char* endDoc, Value& root,
- bool collectComments = true);
- String getFormattedErrorMessages() const;
- std::vector<StructuredError> getStructuredErrors() const;
- private:
- OurReader(OurReader const&); // no impl
- void operator=(OurReader const&); // no impl
- enum TokenType {
- tokenEndOfStream = 0,
- tokenObjectBegin,
- tokenObjectEnd,
- tokenArrayBegin,
- tokenArrayEnd,
- tokenString,
- tokenNumber,
- tokenTrue,
- tokenFalse,
- tokenNull,
- tokenNaN,
- tokenPosInf,
- tokenNegInf,
- tokenArraySeparator,
- tokenMemberSeparator,
- tokenComment,
- tokenError
- };
- class Token {
- public:
- TokenType type_;
- Location start_;
- Location end_;
- };
- class ErrorInfo {
- public:
- Token token_;
- String message_;
- Location extra_;
- };
- using Errors = std::deque<ErrorInfo>;
- bool readToken(Token& token);
- void skipSpaces();
- void skipBom(bool skipBom);
- bool match(const Char* pattern, int patternLength);
- bool readComment();
- bool readCStyleComment(bool* containsNewLineResult);
- bool readCppStyleComment();
- bool readString();
- bool readStringSingleQuote();
- bool readNumber(bool checkInf);
- bool readValue();
- bool readObject(Token& token);
- bool readArray(Token& token);
- bool decodeNumber(Token& token);
- bool decodeNumber(Token& token, Value& decoded);
- bool decodeString(Token& token);
- bool decodeString(Token& token, String& decoded);
- bool decodeDouble(Token& token);
- bool decodeDouble(Token& token, Value& decoded);
- bool decodeUnicodeCodePoint(Token& token, Location& current, Location end,
- unsigned int& unicode);
- bool decodeUnicodeEscapeSequence(Token& token, Location& current,
- Location end, unsigned int& unicode);
- bool addError(const String& message, Token& token, Location extra = nullptr);
- bool recoverFromError(TokenType skipUntilToken);
- bool addErrorAndRecover(const String& message, Token& token,
- TokenType skipUntilToken);
- void skipUntilSpace();
- Value& currentValue();
- Char getNextChar();
- void getLocationLineAndColumn(Location location, int& line,
- int& column) const;
- String getLocationLineAndColumn(Location location) const;
- void addComment(Location begin, Location end, CommentPlacement placement);
- void skipCommentTokens(Token& token);
- static String normalizeEOL(Location begin, Location end);
- static bool containsNewLine(Location begin, Location end);
- using Nodes = std::stack<Value*>;
- Nodes nodes_{};
- Errors errors_{};
- String document_{};
- Location begin_ = nullptr;
- Location end_ = nullptr;
- Location current_ = nullptr;
- Location lastValueEnd_ = nullptr;
- Value* lastValue_ = nullptr;
- bool lastValueHasAComment_ = false;
- String commentsBefore_{};
- OurFeatures const features_;
- bool collectComments_ = false;
- }; // OurReader
- // complete copy of Read impl, for OurReader
- bool OurReader::containsNewLine(OurReader::Location begin,
- OurReader::Location end) {
- return std::any_of(begin, end, [](char b) { return b == '\n' || b == '\r'; });
- }
- OurReader::OurReader(OurFeatures const& features) : features_(features) {}
- bool OurReader::parse(const char* beginDoc, const char* endDoc, Value& root,
- bool collectComments) {
- if (!features_.allowComments_) {
- collectComments = false;
- }
- begin_ = beginDoc;
- end_ = endDoc;
- collectComments_ = collectComments;
- current_ = begin_;
- lastValueEnd_ = nullptr;
- lastValue_ = nullptr;
- commentsBefore_.clear();
- errors_.clear();
- while (!nodes_.empty())
- nodes_.pop();
- nodes_.push(&root);
- // skip byte order mark if it exists at the beginning of the UTF-8 text.
- skipBom(features_.skipBom_);
- bool successful = readValue();
- nodes_.pop();
- Token token;
- skipCommentTokens(token);
- if (features_.failIfExtra_ && (token.type_ != tokenEndOfStream)) {
- addError("Extra non-whitespace after JSON value.", token);
- return false;
- }
- if (collectComments_ && !commentsBefore_.empty())
- root.setComment(commentsBefore_, commentAfter);
- if (features_.strictRoot_) {
- if (!root.isArray() && !root.isObject()) {
- // Set error location to start of doc, ideally should be first token found
- // in doc
- token.type_ = tokenError;
- token.start_ = beginDoc;
- token.end_ = endDoc;
- addError(
- "A valid JSON document must be either an array or an object value.",
- token);
- return false;
- }
- }
- return successful;
- }
- bool OurReader::readValue() {
- // To preserve the old behaviour we cast size_t to int.
- if (nodes_.size() > features_.stackLimit_)
- throwRuntimeError("Exceeded stackLimit in readValue().");
- Token token;
- skipCommentTokens(token);
- bool successful = true;
- if (collectComments_ && !commentsBefore_.empty()) {
- currentValue().setComment(commentsBefore_, commentBefore);
- commentsBefore_.clear();
- }
- switch (token.type_) {
- case tokenObjectBegin:
- successful = readObject(token);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- case tokenArrayBegin:
- successful = readArray(token);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- case tokenNumber:
- successful = decodeNumber(token);
- break;
- case tokenString:
- successful = decodeString(token);
- break;
- case tokenTrue: {
- Value v(true);
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenFalse: {
- Value v(false);
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenNull: {
- Value v;
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenNaN: {
- Value v(std::numeric_limits<double>::quiet_NaN());
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenPosInf: {
- Value v(std::numeric_limits<double>::infinity());
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenNegInf: {
- Value v(-std::numeric_limits<double>::infinity());
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- } break;
- case tokenArraySeparator:
- case tokenObjectEnd:
- case tokenArrayEnd:
- if (features_.allowDroppedNullPlaceholders_) {
- // "Un-read" the current token and mark the current value as a null
- // token.
- current_--;
- Value v;
- currentValue().swapPayload(v);
- currentValue().setOffsetStart(current_ - begin_ - 1);
- currentValue().setOffsetLimit(current_ - begin_);
- break;
- } // else, fall through ...
- default:
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return addError("Syntax error: value, object or array expected.", token);
- }
- if (collectComments_) {
- lastValueEnd_ = current_;
- lastValueHasAComment_ = false;
- lastValue_ = ¤tValue();
- }
- return successful;
- }
- void OurReader::skipCommentTokens(Token& token) {
- if (features_.allowComments_) {
- do {
- readToken(token);
- } while (token.type_ == tokenComment);
- } else {
- readToken(token);
- }
- }
- bool OurReader::readToken(Token& token) {
- skipSpaces();
- token.start_ = current_;
- Char c = getNextChar();
- bool ok = true;
- switch (c) {
- case '{':
- token.type_ = tokenObjectBegin;
- break;
- case '}':
- token.type_ = tokenObjectEnd;
- break;
- case '[':
- token.type_ = tokenArrayBegin;
- break;
- case ']':
- token.type_ = tokenArrayEnd;
- break;
- case '"':
- token.type_ = tokenString;
- ok = readString();
- break;
- case '\'':
- if (features_.allowSingleQuotes_) {
- token.type_ = tokenString;
- ok = readStringSingleQuote();
- } else {
- // If we don't allow single quotes, this is a failure case.
- ok = false;
- }
- break;
- case '/':
- token.type_ = tokenComment;
- ok = readComment();
- break;
- case '0':
- case '1':
- case '2':
- case '3':
- case '4':
- case '5':
- case '6':
- case '7':
- case '8':
- case '9':
- token.type_ = tokenNumber;
- readNumber(false);
- break;
- case '-':
- if (readNumber(true)) {
- token.type_ = tokenNumber;
- } else {
- token.type_ = tokenNegInf;
- ok = features_.allowSpecialFloats_ && match("nfinity", 7);
- }
- break;
- case '+':
- if (readNumber(true)) {
- token.type_ = tokenNumber;
- } else {
- token.type_ = tokenPosInf;
- ok = features_.allowSpecialFloats_ && match("nfinity", 7);
- }
- break;
- case 't':
- token.type_ = tokenTrue;
- ok = match("rue", 3);
- break;
- case 'f':
- token.type_ = tokenFalse;
- ok = match("alse", 4);
- break;
- case 'n':
- token.type_ = tokenNull;
- ok = match("ull", 3);
- break;
- case 'N':
- if (features_.allowSpecialFloats_) {
- token.type_ = tokenNaN;
- ok = match("aN", 2);
- } else {
- ok = false;
- }
- break;
- case 'I':
- if (features_.allowSpecialFloats_) {
- token.type_ = tokenPosInf;
- ok = match("nfinity", 7);
- } else {
- ok = false;
- }
- break;
- case ',':
- token.type_ = tokenArraySeparator;
- break;
- case ':':
- token.type_ = tokenMemberSeparator;
- break;
- case 0:
- token.type_ = tokenEndOfStream;
- break;
- default:
- ok = false;
- break;
- }
- if (!ok)
- token.type_ = tokenError;
- token.end_ = current_;
- return ok;
- }
- void OurReader::skipSpaces() {
- while (current_ != end_) {
- Char c = *current_;
- if (c == ' ' || c == '\t' || c == '\r' || c == '\n')
- ++current_;
- else
- break;
- }
- }
- void OurReader::skipBom(bool skipBom) {
- // The default behavior is to skip BOM.
- if (skipBom) {
- if ((end_ - begin_) >= 3 && strncmp(begin_, "\xEF\xBB\xBF", 3) == 0) {
- begin_ += 3;
- current_ = begin_;
- }
- }
- }
- bool OurReader::match(const Char* pattern, int patternLength) {
- if (end_ - current_ < patternLength)
- return false;
- int index = patternLength;
- while (index--)
- if (current_[index] != pattern[index])
- return false;
- current_ += patternLength;
- return true;
- }
- bool OurReader::readComment() {
- const Location commentBegin = current_ - 1;
- const Char c = getNextChar();
- bool successful = false;
- bool cStyleWithEmbeddedNewline = false;
- const bool isCStyleComment = (c == '*');
- const bool isCppStyleComment = (c == '/');
- if (isCStyleComment) {
- successful = readCStyleComment(&cStyleWithEmbeddedNewline);
- } else if (isCppStyleComment) {
- successful = readCppStyleComment();
- }
- if (!successful)
- return false;
- if (collectComments_) {
- CommentPlacement placement = commentBefore;
- if (!lastValueHasAComment_) {
- if (lastValueEnd_ && !containsNewLine(lastValueEnd_, commentBegin)) {
- if (isCppStyleComment || !cStyleWithEmbeddedNewline) {
- placement = commentAfterOnSameLine;
- lastValueHasAComment_ = true;
- }
- }
- }
- addComment(commentBegin, current_, placement);
- }
- return true;
- }
- String OurReader::normalizeEOL(OurReader::Location begin,
- OurReader::Location end) {
- String normalized;
- normalized.reserve(static_cast<size_t>(end - begin));
- OurReader::Location current = begin;
- while (current != end) {
- char c = *current++;
- if (c == '\r') {
- if (current != end && *current == '\n')
- // convert dos EOL
- ++current;
- // convert Mac EOL
- normalized += '\n';
- } else {
- normalized += c;
- }
- }
- return normalized;
- }
- void OurReader::addComment(Location begin, Location end,
- CommentPlacement placement) {
- assert(collectComments_);
- const String& normalized = normalizeEOL(begin, end);
- if (placement == commentAfterOnSameLine) {
- assert(lastValue_ != nullptr);
- lastValue_->setComment(normalized, placement);
- } else {
- commentsBefore_ += normalized;
- }
- }
- bool OurReader::readCStyleComment(bool* containsNewLineResult) {
- *containsNewLineResult = false;
- while ((current_ + 1) < end_) {
- Char c = getNextChar();
- if (c == '*' && *current_ == '/')
- break;
- if (c == '\n')
- *containsNewLineResult = true;
- }
- return getNextChar() == '/';
- }
- bool OurReader::readCppStyleComment() {
- while (current_ != end_) {
- Char c = getNextChar();
- if (c == '\n')
- break;
- if (c == '\r') {
- // Consume DOS EOL. It will be normalized in addComment.
- if (current_ != end_ && *current_ == '\n')
- getNextChar();
- // Break on Moc OS 9 EOL.
- break;
- }
- }
- return true;
- }
- bool OurReader::readNumber(bool checkInf) {
- Location p = current_;
- if (checkInf && p != end_ && *p == 'I') {
- current_ = ++p;
- return false;
- }
- char c = '0'; // stopgap for already consumed character
- // integral part
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- // fractional part
- if (c == '.') {
- c = (current_ = p) < end_ ? *p++ : '\0';
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- }
- // exponential part
- if (c == 'e' || c == 'E') {
- c = (current_ = p) < end_ ? *p++ : '\0';
- if (c == '+' || c == '-')
- c = (current_ = p) < end_ ? *p++ : '\0';
- while (c >= '0' && c <= '9')
- c = (current_ = p) < end_ ? *p++ : '\0';
- }
- return true;
- }
- bool OurReader::readString() {
- Char c = 0;
- while (current_ != end_) {
- c = getNextChar();
- if (c == '\\')
- getNextChar();
- else if (c == '"')
- break;
- }
- return c == '"';
- }
- bool OurReader::readStringSingleQuote() {
- Char c = 0;
- while (current_ != end_) {
- c = getNextChar();
- if (c == '\\')
- getNextChar();
- else if (c == '\'')
- break;
- }
- return c == '\'';
- }
- bool OurReader::readObject(Token& token) {
- Token tokenName;
- String name;
- Value init(objectValue);
- currentValue().swapPayload(init);
- currentValue().setOffsetStart(token.start_ - begin_);
- while (readToken(tokenName)) {
- bool initialTokenOk = true;
- while (tokenName.type_ == tokenComment && initialTokenOk)
- initialTokenOk = readToken(tokenName);
- if (!initialTokenOk)
- break;
- if (tokenName.type_ == tokenObjectEnd &&
- (name.empty() ||
- features_.allowTrailingCommas_)) // empty object or trailing comma
- return true;
- name.clear();
- if (tokenName.type_ == tokenString) {
- if (!decodeString(tokenName, name))
- return recoverFromError(tokenObjectEnd);
- } else if (tokenName.type_ == tokenNumber && features_.allowNumericKeys_) {
- Value numberName;
- if (!decodeNumber(tokenName, numberName))
- return recoverFromError(tokenObjectEnd);
- name = numberName.asString();
- } else {
- break;
- }
- if (name.length() >= (1U << 30))
- throwRuntimeError("keylength >= 2^30");
- if (features_.rejectDupKeys_ && currentValue().isMember(name)) {
- String msg = "Duplicate key: '" + name + "'";
- return addErrorAndRecover(msg, tokenName, tokenObjectEnd);
- }
- Token colon;
- if (!readToken(colon) || colon.type_ != tokenMemberSeparator) {
- return addErrorAndRecover("Missing ':' after object member name", colon,
- tokenObjectEnd);
- }
- Value& value = currentValue()[name];
- nodes_.push(&value);
- bool ok = readValue();
- nodes_.pop();
- if (!ok) // error already set
- return recoverFromError(tokenObjectEnd);
- Token comma;
- if (!readToken(comma) ||
- (comma.type_ != tokenObjectEnd && comma.type_ != tokenArraySeparator &&
- comma.type_ != tokenComment)) {
- return addErrorAndRecover("Missing ',' or '}' in object declaration",
- comma, tokenObjectEnd);
- }
- bool finalizeTokenOk = true;
- while (comma.type_ == tokenComment && finalizeTokenOk)
- finalizeTokenOk = readToken(comma);
- if (comma.type_ == tokenObjectEnd)
- return true;
- }
- return addErrorAndRecover("Missing '}' or object member name", tokenName,
- tokenObjectEnd);
- }
- bool OurReader::readArray(Token& token) {
- Value init(arrayValue);
- currentValue().swapPayload(init);
- currentValue().setOffsetStart(token.start_ - begin_);
- int index = 0;
- for (;;) {
- skipSpaces();
- if (current_ != end_ && *current_ == ']' &&
- (index == 0 ||
- (features_.allowTrailingCommas_ &&
- !features_.allowDroppedNullPlaceholders_))) // empty array or trailing
- // comma
- {
- Token endArray;
- readToken(endArray);
- return true;
- }
- Value& value = currentValue()[index++];
- nodes_.push(&value);
- bool ok = readValue();
- nodes_.pop();
- if (!ok) // error already set
- return recoverFromError(tokenArrayEnd);
- Token currentToken;
- // Accept Comment after last item in the array.
- ok = readToken(currentToken);
- while (currentToken.type_ == tokenComment && ok) {
- ok = readToken(currentToken);
- }
- bool badTokenType = (currentToken.type_ != tokenArraySeparator &&
- currentToken.type_ != tokenArrayEnd);
- if (!ok || badTokenType) {
- return addErrorAndRecover("Missing ',' or ']' in array declaration",
- currentToken, tokenArrayEnd);
- }
- if (currentToken.type_ == tokenArrayEnd)
- break;
- }
- return true;
- }
- bool OurReader::decodeNumber(Token& token) {
- Value decoded;
- if (!decodeNumber(token, decoded))
- return false;
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool OurReader::decodeNumber(Token& token, Value& decoded) {
- // Attempts to parse the number as an integer. If the number is
- // larger than the maximum supported value of an integer then
- // we decode the number as a double.
- Location current = token.start_;
- const bool isNegative = *current == '-';
- if (isNegative) {
- ++current;
- }
- // We assume we can represent the largest and smallest integer types as
- // unsigned integers with separate sign. This is only true if they can fit
- // into an unsigned integer.
- static_assert(Value::maxLargestInt <= Value::maxLargestUInt,
- "Int must be smaller than UInt");
- // We need to convert minLargestInt into a positive number. The easiest way
- // to do this conversion is to assume our "threshold" value of minLargestInt
- // divided by 10 can fit in maxLargestInt when absolute valued. This should
- // be a safe assumption.
- static_assert(Value::minLargestInt <= -Value::maxLargestInt,
- "The absolute value of minLargestInt must be greater than or "
- "equal to maxLargestInt");
- static_assert(Value::minLargestInt / 10 >= -Value::maxLargestInt,
- "The absolute value of minLargestInt must be only 1 magnitude "
- "larger than maxLargest Int");
- static constexpr Value::LargestUInt positive_threshold =
- Value::maxLargestUInt / 10;
- static constexpr Value::UInt positive_last_digit = Value::maxLargestUInt % 10;
- // For the negative values, we have to be more careful. Since typically
- // -Value::minLargestInt will cause an overflow, we first divide by 10 and
- // then take the inverse. This assumes that minLargestInt is only a single
- // power of 10 different in magnitude, which we check above. For the last
- // digit, we take the modulus before negating for the same reason.
- static constexpr auto negative_threshold =
- Value::LargestUInt(-(Value::minLargestInt / 10));
- static constexpr auto negative_last_digit =
- Value::UInt(-(Value::minLargestInt % 10));
- const Value::LargestUInt threshold =
- isNegative ? negative_threshold : positive_threshold;
- const Value::UInt max_last_digit =
- isNegative ? negative_last_digit : positive_last_digit;
- Value::LargestUInt value = 0;
- while (current < token.end_) {
- Char c = *current++;
- if (c < '0' || c > '9')
- return decodeDouble(token, decoded);
- const auto digit(static_cast<Value::UInt>(c - '0'));
- if (value >= threshold) {
- // We've hit or exceeded the max value divided by 10 (rounded down). If
- // a) we've only just touched the limit, meaning value == threshold,
- // b) this is the last digit, or
- // c) it's small enough to fit in that rounding delta, we're okay.
- // Otherwise treat this number as a double to avoid overflow.
- if (value > threshold || current != token.end_ ||
- digit > max_last_digit) {
- return decodeDouble(token, decoded);
- }
- }
- value = value * 10 + digit;
- }
- if (isNegative) {
- // We use the same magnitude assumption here, just in case.
- const auto last_digit = static_cast<Value::UInt>(value % 10);
- decoded = -Value::LargestInt(value / 10) * 10 - last_digit;
- } else if (value <= Value::LargestUInt(Value::maxLargestInt)) {
- decoded = Value::LargestInt(value);
- } else {
- decoded = value;
- }
- return true;
- }
- bool OurReader::decodeDouble(Token& token) {
- Value decoded;
- if (!decodeDouble(token, decoded))
- return false;
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool OurReader::decodeDouble(Token& token, Value& decoded) {
- double value = 0;
- const String buffer(token.start_, token.end_);
- IStringStream is(buffer);
- if (!(is >> value)) {
- if (value == std::numeric_limits<double>::max())
- value = std::numeric_limits<double>::infinity();
- else if (value == std::numeric_limits<double>::lowest())
- value = -std::numeric_limits<double>::infinity();
- else if (!std::isinf(value))
- return addError(
- "'" + String(token.start_, token.end_) + "' is not a number.", token);
- }
- decoded = value;
- return true;
- }
- bool OurReader::decodeString(Token& token) {
- String decoded_string;
- if (!decodeString(token, decoded_string))
- return false;
- Value decoded(decoded_string);
- currentValue().swapPayload(decoded);
- currentValue().setOffsetStart(token.start_ - begin_);
- currentValue().setOffsetLimit(token.end_ - begin_);
- return true;
- }
- bool OurReader::decodeString(Token& token, String& decoded) {
- decoded.reserve(static_cast<size_t>(token.end_ - token.start_ - 2));
- Location current = token.start_ + 1; // skip '"'
- Location end = token.end_ - 1; // do not include '"'
- while (current != end) {
- Char c = *current++;
- if (c == '"')
- break;
- if (c == '\\') {
- if (current == end)
- return addError("Empty escape sequence in string", token, current);
- Char escape = *current++;
- switch (escape) {
- case '"':
- decoded += '"';
- break;
- case '/':
- decoded += '/';
- break;
- case '\\':
- decoded += '\\';
- break;
- case 'b':
- decoded += '\b';
- break;
- case 'f':
- decoded += '\f';
- break;
- case 'n':
- decoded += '\n';
- break;
- case 'r':
- decoded += '\r';
- break;
- case 't':
- decoded += '\t';
- break;
- case 'u': {
- unsigned int unicode;
- if (!decodeUnicodeCodePoint(token, current, end, unicode))
- return false;
- decoded += codePointToUTF8(unicode);
- } break;
- default:
- return addError("Bad escape sequence in string", token, current);
- }
- } else {
- decoded += c;
- }
- }
- return true;
- }
- bool OurReader::decodeUnicodeCodePoint(Token& token, Location& current,
- Location end, unsigned int& unicode) {
- if (!decodeUnicodeEscapeSequence(token, current, end, unicode))
- return false;
- if (unicode >= 0xD800 && unicode <= 0xDBFF) {
- // surrogate pairs
- if (end - current < 6)
- return addError(
- "additional six characters expected to parse unicode surrogate pair.",
- token, current);
- if (*(current++) == '\\' && *(current++) == 'u') {
- unsigned int surrogatePair;
- if (decodeUnicodeEscapeSequence(token, current, end, surrogatePair)) {
- unicode = 0x10000 + ((unicode & 0x3FF) << 10) + (surrogatePair & 0x3FF);
- } else
- return false;
- } else
- return addError("expecting another \\u token to begin the second half of "
- "a unicode surrogate pair",
- token, current);
- }
- return true;
- }
- bool OurReader::decodeUnicodeEscapeSequence(Token& token, Location& current,
- Location end,
- unsigned int& ret_unicode) {
- if (end - current < 4)
- return addError(
- "Bad unicode escape sequence in string: four digits expected.", token,
- current);
- int unicode = 0;
- for (int index = 0; index < 4; ++index) {
- Char c = *current++;
- unicode *= 16;
- if (c >= '0' && c <= '9')
- unicode += c - '0';
- else if (c >= 'a' && c <= 'f')
- unicode += c - 'a' + 10;
- else if (c >= 'A' && c <= 'F')
- unicode += c - 'A' + 10;
- else
- return addError(
- "Bad unicode escape sequence in string: hexadecimal digit expected.",
- token, current);
- }
- ret_unicode = static_cast<unsigned int>(unicode);
- return true;
- }
- bool OurReader::addError(const String& message, Token& token, Location extra) {
- ErrorInfo info;
- info.token_ = token;
- info.message_ = message;
- info.extra_ = extra;
- errors_.push_back(info);
- return false;
- }
- bool OurReader::recoverFromError(TokenType skipUntilToken) {
- size_t errorCount = errors_.size();
- Token skip;
- for (;;) {
- if (!readToken(skip))
- errors_.resize(errorCount); // discard errors caused by recovery
- if (skip.type_ == skipUntilToken || skip.type_ == tokenEndOfStream)
- break;
- }
- errors_.resize(errorCount);
- return false;
- }
- bool OurReader::addErrorAndRecover(const String& message, Token& token,
- TokenType skipUntilToken) {
- addError(message, token);
- return recoverFromError(skipUntilToken);
- }
- Value& OurReader::currentValue() { return *(nodes_.top()); }
- OurReader::Char OurReader::getNextChar() {
- if (current_ == end_)
- return 0;
- return *current_++;
- }
- void OurReader::getLocationLineAndColumn(Location location, int& line,
- int& column) const {
- Location current = begin_;
- Location lastLineStart = current;
- line = 0;
- while (current < location && current != end_) {
- Char c = *current++;
- if (c == '\r') {
- if (*current == '\n')
- ++current;
- lastLineStart = current;
- ++line;
- } else if (c == '\n') {
- lastLineStart = current;
- ++line;
- }
- }
- // column & line start at 1
- column = int(location - lastLineStart) + 1;
- ++line;
- }
- String OurReader::getLocationLineAndColumn(Location location) const {
- int line, column;
- getLocationLineAndColumn(location, line, column);
- char buffer[18 + 16 + 16 + 1];
- jsoncpp_snprintf(buffer, sizeof(buffer), "Line %d, Column %d", line, column);
- return buffer;
- }
- String OurReader::getFormattedErrorMessages() const {
- String formattedMessage;
- for (const auto& error : errors_) {
- formattedMessage +=
- "* " + getLocationLineAndColumn(error.token_.start_) + "\n";
- formattedMessage += " " + error.message_ + "\n";
- if (error.extra_)
- formattedMessage +=
- "See " + getLocationLineAndColumn(error.extra_) + " for detail.\n";
- }
- return formattedMessage;
- }
- std::vector<OurReader::StructuredError> OurReader::getStructuredErrors() const {
- std::vector<OurReader::StructuredError> allErrors;
- for (const auto& error : errors_) {
- OurReader::StructuredError structured;
- structured.offset_start = error.token_.start_ - begin_;
- structured.offset_limit = error.token_.end_ - begin_;
- structured.message = error.message_;
- allErrors.push_back(structured);
- }
- return allErrors;
- }
- class OurCharReader : public CharReader {
- bool const collectComments_;
- OurReader reader_;
- public:
- OurCharReader(bool collectComments, OurFeatures const& features)
- : collectComments_(collectComments), reader_(features) {}
- bool parse(char const* beginDoc, char const* endDoc, Value* root,
- String* errs) override {
- bool ok = reader_.parse(beginDoc, endDoc, *root, collectComments_);
- if (errs) {
- *errs = reader_.getFormattedErrorMessages();
- }
- return ok;
- }
- };
- CharReaderBuilder::CharReaderBuilder() { setDefaults(&settings_); }
- CharReaderBuilder::~CharReaderBuilder() = default;
- CharReader* CharReaderBuilder::newCharReader() const {
- bool collectComments = settings_["collectComments"].asBool();
- OurFeatures features = OurFeatures::all();
- features.allowComments_ = settings_["allowComments"].asBool();
- features.allowTrailingCommas_ = settings_["allowTrailingCommas"].asBool();
- features.strictRoot_ = settings_["strictRoot"].asBool();
- features.allowDroppedNullPlaceholders_ =
- settings_["allowDroppedNullPlaceholders"].asBool();
- features.allowNumericKeys_ = settings_["allowNumericKeys"].asBool();
- features.allowSingleQuotes_ = settings_["allowSingleQuotes"].asBool();
- // Stack limit is always a size_t, so we get this as an unsigned int
- // regardless of it we have 64-bit integer support enabled.
- features.stackLimit_ = static_cast<size_t>(settings_["stackLimit"].asUInt());
- features.failIfExtra_ = settings_["failIfExtra"].asBool();
- features.rejectDupKeys_ = settings_["rejectDupKeys"].asBool();
- features.allowSpecialFloats_ = settings_["allowSpecialFloats"].asBool();
- features.skipBom_ = settings_["skipBom"].asBool();
- return new OurCharReader(collectComments, features);
- }
- bool CharReaderBuilder::validate(Json::Value* invalid) const {
- static const auto& valid_keys = *new std::set<String>{
- "collectComments",
- "allowComments",
- "allowTrailingCommas",
- "strictRoot",
- "allowDroppedNullPlaceholders",
- "allowNumericKeys",
- "allowSingleQuotes",
- "stackLimit",
- "failIfExtra",
- "rejectDupKeys",
- "allowSpecialFloats",
- "skipBom",
- };
- for (auto si = settings_.begin(); si != settings_.end(); ++si) {
- auto key = si.name();
- if (valid_keys.count(key))
- continue;
- if (invalid)
- (*invalid)[key] = *si;
- else
- return false;
- }
- return invalid ? invalid->empty() : true;
- }
- Value& CharReaderBuilder::operator[](const String& key) {
- return settings_[key];
- }
- // static
- void CharReaderBuilder::strictMode(Json::Value* settings) {
- //! [CharReaderBuilderStrictMode]
- (*settings)["allowComments"] = false;
- (*settings)["allowTrailingCommas"] = false;
- (*settings)["strictRoot"] = true;
- (*settings)["allowDroppedNullPlaceholders"] = false;
- (*settings)["allowNumericKeys"] = false;
- (*settings)["allowSingleQuotes"] = false;
- (*settings)["stackLimit"] = 1000;
- (*settings)["failIfExtra"] = true;
- (*settings)["rejectDupKeys"] = true;
- (*settings)["allowSpecialFloats"] = false;
- (*settings)["skipBom"] = true;
- //! [CharReaderBuilderStrictMode]
- }
- // static
- void CharReaderBuilder::setDefaults(Json::Value* settings) {
- //! [CharReaderBuilderDefaults]
- (*settings)["collectComments"] = true;
- (*settings)["allowComments"] = true;
- (*settings)["allowTrailingCommas"] = true;
- (*settings)["strictRoot"] = false;
- (*settings)["allowDroppedNullPlaceholders"] = false;
- (*settings)["allowNumericKeys"] = false;
- (*settings)["allowSingleQuotes"] = false;
- (*settings)["stackLimit"] = 1000;
- (*settings)["failIfExtra"] = false;
- (*settings)["rejectDupKeys"] = false;
- (*settings)["allowSpecialFloats"] = false;
- (*settings)["skipBom"] = true;
- //! [CharReaderBuilderDefaults]
- }
- //////////////////////////////////
- // global functions
- bool parseFromStream(CharReader::Factory const& fact, IStream& sin, Value* root,
- String* errs) {
- OStringStream ssin;
- ssin << sin.rdbuf();
- String doc = ssin.str();
- char const* begin = doc.data();
- char const* end = begin + doc.size();
- // Note that we do not actually need a null-terminator.
- CharReaderPtr const reader(fact.newCharReader());
- return reader->parse(begin, end, root, errs);
- }
- IStream& operator>>(IStream& sin, Value& root) {
- CharReaderBuilder b;
- String errs;
- bool ok = parseFromStream(b, sin, &root, &errs);
- if (!ok) {
- throwRuntimeError(errs);
- }
- return sin;
- }
- } // namespace Json
|