2
0

reader.h 61 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510
  1. // Tencent is pleased to support the open source community by making RapidJSON available.
  2. //
  3. // Copyright (C) 2015 THL A29 Limited, a Tencent company, and Milo Yip. All rights reserved.
  4. //
  5. // Licensed under the MIT License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // http://opensource.org/licenses/MIT
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #ifndef RAPIDJSON_READER_H_
  15. #define RAPIDJSON_READER_H_
  16. /*! \file reader.h */
  17. #include "rapidjson.h"
  18. #include "encodings.h"
  19. #include "internal/meta.h"
  20. #include "internal/stack.h"
  21. #include "internal/strtod.h"
  22. #if defined(RAPIDJSON_SIMD) && defined(_MSC_VER)
  23. #include <intrin.h>
  24. #pragma intrinsic(_BitScanForward)
  25. #endif
  26. #ifdef RAPIDJSON_SSE42
  27. #include <nmmintrin.h>
  28. #elif defined(RAPIDJSON_SSE2)
  29. #include <emmintrin.h>
  30. #endif
  31. #ifdef _MSC_VER
  32. RAPIDJSON_DIAG_PUSH
  33. RAPIDJSON_DIAG_OFF(4127) // conditional expression is constant
  34. RAPIDJSON_DIAG_OFF(4702) // unreachable code
  35. #endif
  36. #ifdef __GNUC__
  37. RAPIDJSON_DIAG_PUSH
  38. RAPIDJSON_DIAG_OFF(effc++)
  39. #endif
  40. //!@cond RAPIDJSON_HIDDEN_FROM_DOXYGEN
  41. #define RAPIDJSON_NOTHING /* deliberately empty */
  42. #ifndef RAPIDJSON_PARSE_ERROR_EARLY_RETURN
  43. #define RAPIDJSON_PARSE_ERROR_EARLY_RETURN(value) \
  44. RAPIDJSON_MULTILINEMACRO_BEGIN \
  45. if (HasParseError()) { return value; } \
  46. RAPIDJSON_MULTILINEMACRO_END
  47. #endif
  48. #define RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID \
  49. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(RAPIDJSON_NOTHING)
  50. //!@endcond
  51. /*! \def RAPIDJSON_PARSE_ERROR_NORETURN
  52. \ingroup RAPIDJSON_ERRORS
  53. \brief Macro to indicate a parse error.
  54. \param parseErrorCode \ref rapidjson::ParseErrorCode of the error
  55. \param offset position of the error in JSON input (\c size_t)
  56. This macros can be used as a customization point for the internal
  57. error handling mechanism of RapidJSON.
  58. A common usage model is to throw an exception instead of requiring the
  59. caller to explicitly check the \ref rapidjson::GenericReader::Parse's
  60. return value:
  61. \code
  62. #define RAPIDJSON_PARSE_ERROR_NORETURN(parseErrorCode,offset) \
  63. throw ParseException(parseErrorCode, #parseErrorCode, offset)
  64. #include <stdexcept> // std::runtime_error
  65. #include "rapidjson/error/error.h" // rapidjson::ParseResult
  66. struct ParseException : std::runtime_error, rapidjson::ParseResult {
  67. ParseException(rapidjson::ParseErrorCode code, const char* msg, size_t offset)
  68. : std::runtime_error(msg), ParseResult(code, offset) {}
  69. };
  70. #include "rapidjson/reader.h"
  71. \endcode
  72. \see RAPIDJSON_PARSE_ERROR, rapidjson::GenericReader::Parse
  73. */
  74. #ifndef RAPIDJSON_PARSE_ERROR_NORETURN
  75. #define RAPIDJSON_PARSE_ERROR_NORETURN(parseErrorCode, offset) \
  76. RAPIDJSON_MULTILINEMACRO_BEGIN \
  77. RAPIDJSON_ASSERT(!HasParseError()); /* Error can only be assigned once */ \
  78. SetParseError(parseErrorCode, offset); \
  79. RAPIDJSON_MULTILINEMACRO_END
  80. #endif
  81. /*! \def RAPIDJSON_PARSE_ERROR
  82. \ingroup RAPIDJSON_ERRORS
  83. \brief (Internal) macro to indicate and handle a parse error.
  84. \param parseErrorCode \ref rapidjson::ParseErrorCode of the error
  85. \param offset position of the error in JSON input (\c size_t)
  86. Invokes RAPIDJSON_PARSE_ERROR_NORETURN and stops the parsing.
  87. \see RAPIDJSON_PARSE_ERROR_NORETURN
  88. \hideinitializer
  89. */
  90. #ifndef RAPIDJSON_PARSE_ERROR
  91. #define RAPIDJSON_PARSE_ERROR(parseErrorCode, offset) \
  92. RAPIDJSON_MULTILINEMACRO_BEGIN \
  93. RAPIDJSON_PARSE_ERROR_NORETURN(parseErrorCode, offset); \
  94. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID; \
  95. RAPIDJSON_MULTILINEMACRO_END
  96. #endif
  97. #include "error/error.h" // ParseErrorCode, ParseResult
  98. RAPIDJSON_NAMESPACE_BEGIN
  99. ///////////////////////////////////////////////////////////////////////////////
  100. // ParseFlag
  101. /*! \def RAPIDJSON_PARSE_DEFAULT_FLAGS
  102. \ingroup RAPIDJSON_CONFIG
  103. \brief User-defined kParseDefaultFlags definition.
  104. User can define this as any \c ParseFlag combinations.
  105. */
  106. #ifndef RAPIDJSON_PARSE_DEFAULT_FLAGS
  107. #define RAPIDJSON_PARSE_DEFAULT_FLAGS kParseNoFlags
  108. #endif
  109. //! Combination of parseFlags
  110. /*! \see Reader::Parse, Document::Parse, Document::ParseInsitu, Document::ParseStream
  111. */
  112. enum ParseFlag {
  113. kParseNoFlags = 0, //!< No flags are set.
  114. kParseInsituFlag = 1, //!< In-situ(destructive) parsing.
  115. kParseValidateEncodingFlag = 2, //!< Validate encoding of JSON strings.
  116. kParseIterativeFlag = 4, //!< Iterative(constant complexity in terms of function call stack size) parsing.
  117. kParseStopWhenDoneFlag = 8, //!< After parsing a complete JSON root from stream, stop further processing the rest of stream. When this flag is used, parser will not generate kParseErrorDocumentRootNotSingular error.
  118. kParseFullPrecisionFlag = 16, //!< Parse number in full precision (but slower).
  119. kParseCommentsFlag = 32, //!< Allow one-line (//) and multi-line (/**/) comments.
  120. kParseDefaultFlags = RAPIDJSON_PARSE_DEFAULT_FLAGS //!< Default parse flags. Can be customized by defining RAPIDJSON_PARSE_DEFAULT_FLAGS
  121. };
  122. ///////////////////////////////////////////////////////////////////////////////
  123. // Handler
  124. /*! \class rapidjson::Handler
  125. \brief Concept for receiving events from GenericReader upon parsing.
  126. The functions return true if no error occurs. If they return false,
  127. the event publisher should terminate the process.
  128. \code
  129. concept Handler {
  130. typename Ch;
  131. bool Null();
  132. bool Bool(bool b);
  133. bool Int(int i);
  134. bool Uint(unsigned i);
  135. bool Int64(int64_t i);
  136. bool Uint64(uint64_t i);
  137. bool Double(double d);
  138. bool String(const Ch* str, SizeType length, bool copy);
  139. bool StartObject();
  140. bool Key(const Ch* str, SizeType length, bool copy);
  141. bool EndObject(SizeType memberCount);
  142. bool StartArray();
  143. bool EndArray(SizeType elementCount);
  144. };
  145. \endcode
  146. */
  147. ///////////////////////////////////////////////////////////////////////////////
  148. // BaseReaderHandler
  149. //! Default implementation of Handler.
  150. /*! This can be used as base class of any reader handler.
  151. \note implements Handler concept
  152. */
  153. template<typename Encoding = UTF8<>, typename Derived = void>
  154. struct BaseReaderHandler {
  155. typedef typename Encoding::Ch Ch;
  156. typedef typename internal::SelectIf<internal::IsSame<Derived, void>, BaseReaderHandler, Derived>::Type Override;
  157. bool Default() { return true; }
  158. bool Null() { return static_cast<Override&>(*this).Default(); }
  159. bool Bool(bool) { return static_cast<Override&>(*this).Default(); }
  160. bool Int(int) { return static_cast<Override&>(*this).Default(); }
  161. bool Uint(unsigned) { return static_cast<Override&>(*this).Default(); }
  162. bool Int64(int64_t) { return static_cast<Override&>(*this).Default(); }
  163. bool Uint64(uint64_t) { return static_cast<Override&>(*this).Default(); }
  164. bool Double(double) { return static_cast<Override&>(*this).Default(); }
  165. bool String(const Ch*, SizeType, bool) { return static_cast<Override&>(*this).Default(); }
  166. bool StartObject() { return static_cast<Override&>(*this).Default(); }
  167. bool Key(const Ch* str, SizeType len, bool copy) { return static_cast<Override&>(*this).String(str, len, copy); }
  168. bool EndObject(SizeType) { return static_cast<Override&>(*this).Default(); }
  169. bool StartArray() { return static_cast<Override&>(*this).Default(); }
  170. bool EndArray(SizeType) { return static_cast<Override&>(*this).Default(); }
  171. };
  172. ///////////////////////////////////////////////////////////////////////////////
  173. // StreamLocalCopy
  174. namespace internal {
  175. template<typename Stream, int = StreamTraits<Stream>::copyOptimization>
  176. class StreamLocalCopy;
  177. //! Do copy optimization.
  178. template<typename Stream>
  179. class StreamLocalCopy<Stream, 1> {
  180. public:
  181. StreamLocalCopy(Stream& original) : s(original), original_(original) {}
  182. ~StreamLocalCopy() { original_ = s; }
  183. Stream s;
  184. private:
  185. StreamLocalCopy& operator=(const StreamLocalCopy&) /* = delete */;
  186. Stream& original_;
  187. };
  188. //! Keep reference.
  189. template<typename Stream>
  190. class StreamLocalCopy<Stream, 0> {
  191. public:
  192. StreamLocalCopy(Stream& original) : s(original) {}
  193. Stream& s;
  194. private:
  195. StreamLocalCopy& operator=(const StreamLocalCopy&) /* = delete */;
  196. };
  197. } // namespace internal
  198. ///////////////////////////////////////////////////////////////////////////////
  199. // SkipWhitespace
  200. //! Skip the JSON white spaces in a stream.
  201. /*! \param is A input stream for skipping white spaces.
  202. \note This function has SSE2/SSE4.2 specialization.
  203. */
  204. template<typename InputStream>
  205. void SkipWhitespace(InputStream& is) {
  206. internal::StreamLocalCopy<InputStream> copy(is);
  207. InputStream& s(copy.s);
  208. while (s.Peek() == ' ' || s.Peek() == '\n' || s.Peek() == '\r' || s.Peek() == '\t')
  209. s.Take();
  210. }
  211. #ifdef RAPIDJSON_SSE42
  212. //! Skip whitespace with SSE 4.2 pcmpistrm instruction, testing 16 8-byte characters at once.
  213. inline const char *SkipWhitespace_SIMD(const char* p) {
  214. // Fast return for single non-whitespace
  215. if (*p == ' ' || *p == '\n' || *p == '\r' || *p == '\t')
  216. ++p;
  217. else
  218. return p;
  219. // 16-byte align to the next boundary
  220. const char* nextAligned = reinterpret_cast<const char*>((reinterpret_cast<size_t>(p) + 15) & ~15);
  221. while (p != nextAligned)
  222. if (*p == ' ' || *p == '\n' || *p == '\r' || *p == '\t')
  223. ++p;
  224. else
  225. return p;
  226. // The rest of string using SIMD
  227. static const char whitespace[16] = " \n\r\t";
  228. const __m128i w = _mm_loadu_si128((const __m128i *)&whitespace[0]);
  229. for (;; p += 16) {
  230. const __m128i s = _mm_load_si128((const __m128i *)p);
  231. const unsigned r = _mm_cvtsi128_si32(_mm_cmpistrm(w, s, _SIDD_UBYTE_OPS | _SIDD_CMP_EQUAL_ANY | _SIDD_BIT_MASK | _SIDD_NEGATIVE_POLARITY));
  232. if (r != 0) { // some of characters is non-whitespace
  233. #ifdef _MSC_VER // Find the index of first non-whitespace
  234. unsigned long offset;
  235. _BitScanForward(&offset, r);
  236. return p + offset;
  237. #else
  238. return p + __builtin_ffs(r) - 1;
  239. #endif
  240. }
  241. }
  242. }
  243. #elif defined(RAPIDJSON_SSE2)
  244. //! Skip whitespace with SSE2 instructions, testing 16 8-byte characters at once.
  245. inline const char *SkipWhitespace_SIMD(const char* p) {
  246. // Fast return for single non-whitespace
  247. if (*p == ' ' || *p == '\n' || *p == '\r' || *p == '\t')
  248. ++p;
  249. else
  250. return p;
  251. // 16-byte align to the next boundary
  252. const char* nextAligned = reinterpret_cast<const char*>((reinterpret_cast<size_t>(p) + 15) & ~15);
  253. while (p != nextAligned)
  254. if (*p == ' ' || *p == '\n' || *p == '\r' || *p == '\t')
  255. ++p;
  256. else
  257. return p;
  258. // The rest of string
  259. static const char whitespaces[4][17] = {
  260. " ",
  261. "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
  262. "\r\r\r\r\r\r\r\r\r\r\r\r\r\r\r\r",
  263. "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t"};
  264. const __m128i w0 = _mm_loadu_si128((const __m128i *)&whitespaces[0][0]);
  265. const __m128i w1 = _mm_loadu_si128((const __m128i *)&whitespaces[1][0]);
  266. const __m128i w2 = _mm_loadu_si128((const __m128i *)&whitespaces[2][0]);
  267. const __m128i w3 = _mm_loadu_si128((const __m128i *)&whitespaces[3][0]);
  268. for (;; p += 16) {
  269. const __m128i s = _mm_load_si128((const __m128i *)p);
  270. __m128i x = _mm_cmpeq_epi8(s, w0);
  271. x = _mm_or_si128(x, _mm_cmpeq_epi8(s, w1));
  272. x = _mm_or_si128(x, _mm_cmpeq_epi8(s, w2));
  273. x = _mm_or_si128(x, _mm_cmpeq_epi8(s, w3));
  274. unsigned short r = (unsigned short)~_mm_movemask_epi8(x);
  275. if (r != 0) { // some of characters may be non-whitespace
  276. #ifdef _MSC_VER // Find the index of first non-whitespace
  277. unsigned long offset;
  278. _BitScanForward(&offset, r);
  279. return p + offset;
  280. #else
  281. return p + __builtin_ffs(r) - 1;
  282. #endif
  283. }
  284. }
  285. }
  286. #endif // RAPIDJSON_SSE2
  287. #ifdef RAPIDJSON_SIMD
  288. //! Template function specialization for InsituStringStream
  289. template<> inline void SkipWhitespace(InsituStringStream& is) {
  290. is.src_ = const_cast<char*>(SkipWhitespace_SIMD(is.src_));
  291. }
  292. //! Template function specialization for StringStream
  293. template<> inline void SkipWhitespace(StringStream& is) {
  294. is.src_ = SkipWhitespace_SIMD(is.src_);
  295. }
  296. #endif // RAPIDJSON_SIMD
  297. ///////////////////////////////////////////////////////////////////////////////
  298. // GenericReader
  299. //! SAX-style JSON parser. Use \ref Reader for UTF8 encoding and default allocator.
  300. /*! GenericReader parses JSON text from a stream, and send events synchronously to an
  301. object implementing Handler concept.
  302. It needs to allocate a stack for storing a single decoded string during
  303. non-destructive parsing.
  304. For in-situ parsing, the decoded string is directly written to the source
  305. text string, no temporary buffer is required.
  306. A GenericReader object can be reused for parsing multiple JSON text.
  307. \tparam SourceEncoding Encoding of the input stream.
  308. \tparam TargetEncoding Encoding of the parse output.
  309. \tparam StackAllocator Allocator type for stack.
  310. */
  311. template <typename SourceEncoding, typename TargetEncoding, typename StackAllocator = CrtAllocator>
  312. class GenericReader {
  313. public:
  314. typedef typename SourceEncoding::Ch Ch; //!< SourceEncoding character type
  315. //! Constructor.
  316. /*! \param stackAllocator Optional allocator for allocating stack memory. (Only use for non-destructive parsing)
  317. \param stackCapacity stack capacity in bytes for storing a single decoded string. (Only use for non-destructive parsing)
  318. */
  319. GenericReader(StackAllocator* stackAllocator = 0, size_t stackCapacity = kDefaultStackCapacity) : stack_(stackAllocator, stackCapacity), parseResult_() {}
  320. //! Parse JSON text.
  321. /*! \tparam parseFlags Combination of \ref ParseFlag.
  322. \tparam InputStream Type of input stream, implementing Stream concept.
  323. \tparam Handler Type of handler, implementing Handler concept.
  324. \param is Input stream to be parsed.
  325. \param handler The handler to receive events.
  326. \return Whether the parsing is successful.
  327. */
  328. template <unsigned parseFlags, typename InputStream, typename Handler>
  329. ParseResult Parse(InputStream& is, Handler& handler) {
  330. if (parseFlags & kParseIterativeFlag)
  331. return IterativeParse<parseFlags>(is, handler);
  332. parseResult_.Clear();
  333. ClearStackOnExit scope(*this);
  334. SkipWhitespaceAndComments<parseFlags>(is);
  335. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  336. if (is.Peek() == '\0') {
  337. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorDocumentEmpty, is.Tell());
  338. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  339. }
  340. else {
  341. ParseValue<parseFlags>(is, handler);
  342. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  343. if (!(parseFlags & kParseStopWhenDoneFlag)) {
  344. SkipWhitespaceAndComments<parseFlags>(is);
  345. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  346. if (is.Peek() != '\0') {
  347. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorDocumentRootNotSingular, is.Tell());
  348. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  349. }
  350. }
  351. }
  352. return parseResult_;
  353. }
  354. //! Parse JSON text (with \ref kParseDefaultFlags)
  355. /*! \tparam InputStream Type of input stream, implementing Stream concept
  356. \tparam Handler Type of handler, implementing Handler concept.
  357. \param is Input stream to be parsed.
  358. \param handler The handler to receive events.
  359. \return Whether the parsing is successful.
  360. */
  361. template <typename InputStream, typename Handler>
  362. ParseResult Parse(InputStream& is, Handler& handler) {
  363. return Parse<kParseDefaultFlags>(is, handler);
  364. }
  365. //! Whether a parse error has occured in the last parsing.
  366. bool HasParseError() const { return parseResult_.IsError(); }
  367. //! Get the \ref ParseErrorCode of last parsing.
  368. ParseErrorCode GetParseErrorCode() const { return parseResult_.Code(); }
  369. //! Get the position of last parsing error in input, 0 otherwise.
  370. size_t GetErrorOffset() const { return parseResult_.Offset(); }
  371. protected:
  372. void SetParseError(ParseErrorCode code, size_t offset) { parseResult_.Set(code, offset); }
  373. private:
  374. // Prohibit copy constructor & assignment operator.
  375. GenericReader(const GenericReader&);
  376. GenericReader& operator=(const GenericReader&);
  377. void ClearStack() { stack_.Clear(); }
  378. // clear stack on any exit from ParseStream, e.g. due to exception
  379. struct ClearStackOnExit {
  380. explicit ClearStackOnExit(GenericReader& r) : r_(r) {}
  381. ~ClearStackOnExit() { r_.ClearStack(); }
  382. private:
  383. GenericReader& r_;
  384. ClearStackOnExit(const ClearStackOnExit&);
  385. ClearStackOnExit& operator=(const ClearStackOnExit&);
  386. };
  387. template<unsigned parseFlags, typename InputStream>
  388. void SkipWhitespaceAndComments(InputStream& is) {
  389. SkipWhitespace(is);
  390. if (parseFlags & kParseCommentsFlag) {
  391. while (is.Peek() == '/') {
  392. is.Take();
  393. if (is.Peek() == '*') {
  394. is.Take();
  395. while (true) {
  396. if (is.Peek() == '\0')
  397. RAPIDJSON_PARSE_ERROR(kParseErrorUnspecificSyntaxError, is.Tell());
  398. if (is.Take() == '*') {
  399. if (is.Peek() == '\0')
  400. RAPIDJSON_PARSE_ERROR(kParseErrorUnspecificSyntaxError, is.Tell());
  401. if (is.Take() == '/')
  402. break;
  403. }
  404. }
  405. } else if (is.Peek() == '/') {
  406. is.Take();
  407. while (is.Peek() != '\0' && is.Take() != '\n') { }
  408. } else {
  409. RAPIDJSON_PARSE_ERROR(kParseErrorUnspecificSyntaxError, is.Tell());
  410. }
  411. SkipWhitespace(is);
  412. }
  413. }
  414. }
  415. // Parse object: { string : value, ... }
  416. template<unsigned parseFlags, typename InputStream, typename Handler>
  417. void ParseObject(InputStream& is, Handler& handler) {
  418. RAPIDJSON_ASSERT(is.Peek() == '{');
  419. is.Take(); // Skip '{'
  420. if (!handler.StartObject())
  421. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  422. SkipWhitespaceAndComments<parseFlags>(is);
  423. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  424. if (is.Peek() == '}') {
  425. is.Take();
  426. if (!handler.EndObject(0)) // empty object
  427. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  428. return;
  429. }
  430. for (SizeType memberCount = 0;;) {
  431. if (is.Peek() != '"')
  432. RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissName, is.Tell());
  433. ParseString<parseFlags>(is, handler, true);
  434. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  435. SkipWhitespaceAndComments<parseFlags>(is);
  436. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  437. if (is.Take() != ':')
  438. RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissColon, is.Tell());
  439. SkipWhitespaceAndComments<parseFlags>(is);
  440. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  441. ParseValue<parseFlags>(is, handler);
  442. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  443. SkipWhitespaceAndComments<parseFlags>(is);
  444. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  445. ++memberCount;
  446. switch (is.Take()) {
  447. case ',':
  448. SkipWhitespaceAndComments<parseFlags>(is);
  449. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  450. break;
  451. case '}':
  452. if (!handler.EndObject(memberCount))
  453. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  454. return;
  455. default:
  456. RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissCommaOrCurlyBracket, is.Tell());
  457. break;
  458. }
  459. }
  460. }
  461. // Parse array: [ value, ... ]
  462. template<unsigned parseFlags, typename InputStream, typename Handler>
  463. void ParseArray(InputStream& is, Handler& handler) {
  464. RAPIDJSON_ASSERT(is.Peek() == '[');
  465. is.Take(); // Skip '['
  466. if (!handler.StartArray())
  467. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  468. SkipWhitespaceAndComments<parseFlags>(is);
  469. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  470. if (is.Peek() == ']') {
  471. is.Take();
  472. if (!handler.EndArray(0)) // empty array
  473. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  474. return;
  475. }
  476. for (SizeType elementCount = 0;;) {
  477. ParseValue<parseFlags>(is, handler);
  478. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  479. ++elementCount;
  480. SkipWhitespaceAndComments<parseFlags>(is);
  481. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  482. switch (is.Take()) {
  483. case ',':
  484. SkipWhitespaceAndComments<parseFlags>(is);
  485. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  486. break;
  487. case ']':
  488. if (!handler.EndArray(elementCount))
  489. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  490. return;
  491. default:
  492. RAPIDJSON_PARSE_ERROR(kParseErrorArrayMissCommaOrSquareBracket, is.Tell());
  493. break;
  494. }
  495. }
  496. }
  497. template<unsigned parseFlags, typename InputStream, typename Handler>
  498. void ParseNull(InputStream& is, Handler& handler) {
  499. RAPIDJSON_ASSERT(is.Peek() == 'n');
  500. is.Take();
  501. if (is.Take() == 'u' && is.Take() == 'l' && is.Take() == 'l') {
  502. if (!handler.Null())
  503. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  504. }
  505. else
  506. RAPIDJSON_PARSE_ERROR(kParseErrorValueInvalid, is.Tell() - 1);
  507. }
  508. template<unsigned parseFlags, typename InputStream, typename Handler>
  509. void ParseTrue(InputStream& is, Handler& handler) {
  510. RAPIDJSON_ASSERT(is.Peek() == 't');
  511. is.Take();
  512. if (is.Take() == 'r' && is.Take() == 'u' && is.Take() == 'e') {
  513. if (!handler.Bool(true))
  514. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  515. }
  516. else
  517. RAPIDJSON_PARSE_ERROR(kParseErrorValueInvalid, is.Tell() - 1);
  518. }
  519. template<unsigned parseFlags, typename InputStream, typename Handler>
  520. void ParseFalse(InputStream& is, Handler& handler) {
  521. RAPIDJSON_ASSERT(is.Peek() == 'f');
  522. is.Take();
  523. if (is.Take() == 'a' && is.Take() == 'l' && is.Take() == 's' && is.Take() == 'e') {
  524. if (!handler.Bool(false))
  525. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, is.Tell());
  526. }
  527. else
  528. RAPIDJSON_PARSE_ERROR(kParseErrorValueInvalid, is.Tell() - 1);
  529. }
  530. // Helper function to parse four hexidecimal digits in \uXXXX in ParseString().
  531. template<typename InputStream>
  532. unsigned ParseHex4(InputStream& is) {
  533. unsigned codepoint = 0;
  534. for (int i = 0; i < 4; i++) {
  535. Ch c = is.Take();
  536. codepoint <<= 4;
  537. codepoint += static_cast<unsigned>(c);
  538. if (c >= '0' && c <= '9')
  539. codepoint -= '0';
  540. else if (c >= 'A' && c <= 'F')
  541. codepoint -= 'A' - 10;
  542. else if (c >= 'a' && c <= 'f')
  543. codepoint -= 'a' - 10;
  544. else {
  545. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorStringUnicodeEscapeInvalidHex, is.Tell() - 1);
  546. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(0);
  547. }
  548. }
  549. return codepoint;
  550. }
  551. template <typename CharType>
  552. class StackStream {
  553. public:
  554. typedef CharType Ch;
  555. StackStream(internal::Stack<StackAllocator>& stack) : stack_(stack), length_(0) {}
  556. RAPIDJSON_FORCEINLINE void Put(Ch c) {
  557. *stack_.template Push<Ch>() = c;
  558. ++length_;
  559. }
  560. size_t Length() const { return length_; }
  561. Ch* Pop() {
  562. return stack_.template Pop<Ch>(length_);
  563. }
  564. private:
  565. StackStream(const StackStream&);
  566. StackStream& operator=(const StackStream&);
  567. internal::Stack<StackAllocator>& stack_;
  568. SizeType length_;
  569. };
  570. // Parse string and generate String event. Different code paths for kParseInsituFlag.
  571. template<unsigned parseFlags, typename InputStream, typename Handler>
  572. void ParseString(InputStream& is, Handler& handler, bool isKey = false) {
  573. internal::StreamLocalCopy<InputStream> copy(is);
  574. InputStream& s(copy.s);
  575. bool success = false;
  576. if (parseFlags & kParseInsituFlag) {
  577. typename InputStream::Ch *head = s.PutBegin();
  578. ParseStringToStream<parseFlags, SourceEncoding, SourceEncoding>(s, s);
  579. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  580. size_t length = s.PutEnd(head) - 1;
  581. RAPIDJSON_ASSERT(length <= 0xFFFFFFFF);
  582. const typename TargetEncoding::Ch* const str = (typename TargetEncoding::Ch*)head;
  583. success = (isKey ? handler.Key(str, SizeType(length), false) : handler.String(str, SizeType(length), false));
  584. }
  585. else {
  586. StackStream<typename TargetEncoding::Ch> stackStream(stack_);
  587. ParseStringToStream<parseFlags, SourceEncoding, TargetEncoding>(s, stackStream);
  588. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  589. SizeType length = static_cast<SizeType>(stackStream.Length()) - 1;
  590. const typename TargetEncoding::Ch* const str = stackStream.Pop();
  591. success = (isKey ? handler.Key(str, length, true) : handler.String(str, length, true));
  592. }
  593. if (!success)
  594. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, s.Tell());
  595. }
  596. // Parse string to an output is
  597. // This function handles the prefix/suffix double quotes, escaping, and optional encoding validation.
  598. template<unsigned parseFlags, typename SEncoding, typename TEncoding, typename InputStream, typename OutputStream>
  599. RAPIDJSON_FORCEINLINE void ParseStringToStream(InputStream& is, OutputStream& os) {
  600. //!@cond RAPIDJSON_HIDDEN_FROM_DOXYGEN
  601. #define Z16 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
  602. static const char escape[256] = {
  603. Z16, Z16, 0, 0,'\"', 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,'/',
  604. Z16, Z16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,'\\', 0, 0, 0,
  605. 0, 0,'\b', 0, 0, 0,'\f', 0, 0, 0, 0, 0, 0, 0,'\n', 0,
  606. 0, 0,'\r', 0,'\t', 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  607. Z16, Z16, Z16, Z16, Z16, Z16, Z16, Z16
  608. };
  609. #undef Z16
  610. //!@endcond
  611. RAPIDJSON_ASSERT(is.Peek() == '\"');
  612. is.Take(); // Skip '\"'
  613. for (;;) {
  614. Ch c = is.Peek();
  615. if (c == '\\') { // Escape
  616. is.Take();
  617. Ch e = is.Take();
  618. if ((sizeof(Ch) == 1 || unsigned(e) < 256) && escape[(unsigned char)e]) {
  619. os.Put(escape[(unsigned char)e]);
  620. }
  621. else if (e == 'u') { // Unicode
  622. unsigned codepoint = ParseHex4(is);
  623. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  624. if (codepoint >= 0xD800 && codepoint <= 0xDBFF) {
  625. // Handle UTF-16 surrogate pair
  626. if (is.Take() != '\\' || is.Take() != 'u')
  627. RAPIDJSON_PARSE_ERROR(kParseErrorStringUnicodeSurrogateInvalid, is.Tell() - 2);
  628. unsigned codepoint2 = ParseHex4(is);
  629. RAPIDJSON_PARSE_ERROR_EARLY_RETURN_VOID;
  630. if (codepoint2 < 0xDC00 || codepoint2 > 0xDFFF)
  631. RAPIDJSON_PARSE_ERROR(kParseErrorStringUnicodeSurrogateInvalid, is.Tell() - 2);
  632. codepoint = (((codepoint - 0xD800) << 10) | (codepoint2 - 0xDC00)) + 0x10000;
  633. }
  634. TEncoding::Encode(os, codepoint);
  635. }
  636. else
  637. RAPIDJSON_PARSE_ERROR(kParseErrorStringEscapeInvalid, is.Tell() - 1);
  638. }
  639. else if (c == '"') { // Closing double quote
  640. is.Take();
  641. os.Put('\0'); // null-terminate the string
  642. return;
  643. }
  644. else if (c == '\0')
  645. RAPIDJSON_PARSE_ERROR(kParseErrorStringMissQuotationMark, is.Tell() - 1);
  646. else if ((unsigned)c < 0x20) // RFC 4627: unescaped = %x20-21 / %x23-5B / %x5D-10FFFF
  647. RAPIDJSON_PARSE_ERROR(kParseErrorStringEscapeInvalid, is.Tell() - 1);
  648. else {
  649. if (parseFlags & kParseValidateEncodingFlag ?
  650. !Transcoder<SEncoding, TEncoding>::Validate(is, os) :
  651. !Transcoder<SEncoding, TEncoding>::Transcode(is, os))
  652. RAPIDJSON_PARSE_ERROR(kParseErrorStringInvalidEncoding, is.Tell());
  653. }
  654. }
  655. }
  656. template<typename InputStream, bool backup>
  657. class NumberStream;
  658. template<typename InputStream>
  659. class NumberStream<InputStream, false> {
  660. public:
  661. NumberStream(GenericReader& reader, InputStream& s) : is(s) { (void)reader; }
  662. ~NumberStream() {}
  663. RAPIDJSON_FORCEINLINE Ch Peek() const { return is.Peek(); }
  664. RAPIDJSON_FORCEINLINE Ch TakePush() { return is.Take(); }
  665. RAPIDJSON_FORCEINLINE Ch Take() { return is.Take(); }
  666. size_t Tell() { return is.Tell(); }
  667. size_t Length() { return 0; }
  668. const char* Pop() { return 0; }
  669. protected:
  670. NumberStream& operator=(const NumberStream&);
  671. InputStream& is;
  672. };
  673. template<typename InputStream>
  674. class NumberStream<InputStream, true> : public NumberStream<InputStream, false> {
  675. typedef NumberStream<InputStream, false> Base;
  676. public:
  677. NumberStream(GenericReader& reader, InputStream& is) : NumberStream<InputStream, false>(reader, is), stackStream(reader.stack_) {}
  678. ~NumberStream() {}
  679. RAPIDJSON_FORCEINLINE Ch TakePush() {
  680. stackStream.Put((char)Base::is.Peek());
  681. return Base::is.Take();
  682. }
  683. size_t Length() { return stackStream.Length(); }
  684. const char* Pop() {
  685. stackStream.Put('\0');
  686. return stackStream.Pop();
  687. }
  688. private:
  689. StackStream<char> stackStream;
  690. };
  691. template<unsigned parseFlags, typename InputStream, typename Handler>
  692. void ParseNumber(InputStream& is, Handler& handler) {
  693. internal::StreamLocalCopy<InputStream> copy(is);
  694. NumberStream<InputStream, (parseFlags & kParseFullPrecisionFlag) != 0> s(*this, copy.s);
  695. // Parse minus
  696. bool minus = false;
  697. if (s.Peek() == '-') {
  698. minus = true;
  699. s.Take();
  700. }
  701. // Parse int: zero / ( digit1-9 *DIGIT )
  702. unsigned i = 0;
  703. uint64_t i64 = 0;
  704. bool use64bit = false;
  705. int significandDigit = 0;
  706. if (s.Peek() == '0') {
  707. i = 0;
  708. s.TakePush();
  709. }
  710. else if (s.Peek() >= '1' && s.Peek() <= '9') {
  711. i = static_cast<unsigned>(s.TakePush() - '0');
  712. if (minus)
  713. while (s.Peek() >= '0' && s.Peek() <= '9') {
  714. if (i >= 214748364) { // 2^31 = 2147483648
  715. if (i != 214748364 || s.Peek() > '8') {
  716. i64 = i;
  717. use64bit = true;
  718. break;
  719. }
  720. }
  721. i = i * 10 + static_cast<unsigned>(s.TakePush() - '0');
  722. significandDigit++;
  723. }
  724. else
  725. while (s.Peek() >= '0' && s.Peek() <= '9') {
  726. if (i >= 429496729) { // 2^32 - 1 = 4294967295
  727. if (i != 429496729 || s.Peek() > '5') {
  728. i64 = i;
  729. use64bit = true;
  730. break;
  731. }
  732. }
  733. i = i * 10 + static_cast<unsigned>(s.TakePush() - '0');
  734. significandDigit++;
  735. }
  736. }
  737. else
  738. RAPIDJSON_PARSE_ERROR(kParseErrorValueInvalid, s.Tell());
  739. // Parse 64bit int
  740. bool useDouble = false;
  741. double d = 0.0;
  742. if (use64bit) {
  743. if (minus)
  744. while (s.Peek() >= '0' && s.Peek() <= '9') {
  745. if (i64 >= RAPIDJSON_UINT64_C2(0x0CCCCCCC, 0xCCCCCCCC)) // 2^63 = 9223372036854775808
  746. if (i64 != RAPIDJSON_UINT64_C2(0x0CCCCCCC, 0xCCCCCCCC) || s.Peek() > '8') {
  747. d = i64;
  748. useDouble = true;
  749. break;
  750. }
  751. i64 = i64 * 10 + static_cast<unsigned>(s.TakePush() - '0');
  752. significandDigit++;
  753. }
  754. else
  755. while (s.Peek() >= '0' && s.Peek() <= '9') {
  756. if (i64 >= RAPIDJSON_UINT64_C2(0x19999999, 0x99999999)) // 2^64 - 1 = 18446744073709551615
  757. if (i64 != RAPIDJSON_UINT64_C2(0x19999999, 0x99999999) || s.Peek() > '5') {
  758. d = i64;
  759. useDouble = true;
  760. break;
  761. }
  762. i64 = i64 * 10 + static_cast<unsigned>(s.TakePush() - '0');
  763. significandDigit++;
  764. }
  765. }
  766. // Force double for big integer
  767. if (useDouble) {
  768. while (s.Peek() >= '0' && s.Peek() <= '9') {
  769. if (d >= 1.7976931348623157e307) // DBL_MAX / 10.0
  770. RAPIDJSON_PARSE_ERROR(kParseErrorNumberTooBig, s.Tell());
  771. d = d * 10 + (s.TakePush() - '0');
  772. }
  773. }
  774. // Parse frac = decimal-point 1*DIGIT
  775. int expFrac = 0;
  776. size_t decimalPosition;
  777. if (s.Peek() == '.') {
  778. s.Take();
  779. decimalPosition = s.Length();
  780. if (!(s.Peek() >= '0' && s.Peek() <= '9'))
  781. RAPIDJSON_PARSE_ERROR(kParseErrorNumberMissFraction, s.Tell());
  782. if (!useDouble) {
  783. #if RAPIDJSON_64BIT
  784. // Use i64 to store significand in 64-bit architecture
  785. if (!use64bit)
  786. i64 = i;
  787. while (s.Peek() >= '0' && s.Peek() <= '9') {
  788. if (i64 > RAPIDJSON_UINT64_C2(0x1FFFFF, 0xFFFFFFFF)) // 2^53 - 1 for fast path
  789. break;
  790. else {
  791. i64 = i64 * 10 + static_cast<unsigned>(s.TakePush() - '0');
  792. --expFrac;
  793. if (i64 != 0)
  794. significandDigit++;
  795. }
  796. }
  797. d = (double)i64;
  798. #else
  799. // Use double to store significand in 32-bit architecture
  800. d = use64bit ? (double)i64 : (double)i;
  801. #endif
  802. useDouble = true;
  803. }
  804. while (s.Peek() >= '0' && s.Peek() <= '9') {
  805. if (significandDigit < 17) {
  806. d = d * 10.0 + (s.TakePush() - '0');
  807. --expFrac;
  808. if (d > 0.0)
  809. significandDigit++;
  810. }
  811. else
  812. s.TakePush();
  813. }
  814. }
  815. else
  816. decimalPosition = s.Length(); // decimal position at the end of integer.
  817. // Parse exp = e [ minus / plus ] 1*DIGIT
  818. int exp = 0;
  819. if (s.Peek() == 'e' || s.Peek() == 'E') {
  820. if (!useDouble) {
  821. d = use64bit ? i64 : i;
  822. useDouble = true;
  823. }
  824. s.Take();
  825. bool expMinus = false;
  826. if (s.Peek() == '+')
  827. s.Take();
  828. else if (s.Peek() == '-') {
  829. s.Take();
  830. expMinus = true;
  831. }
  832. if (s.Peek() >= '0' && s.Peek() <= '9') {
  833. exp = s.Take() - '0';
  834. if (expMinus) {
  835. while (s.Peek() >= '0' && s.Peek() <= '9') {
  836. exp = exp * 10 + (s.Take() - '0');
  837. if (exp >= 214748364) { // Issue #313: prevent overflow exponent
  838. while (s.Peek() >= '0' && s.Peek() <= '9') // Consume the rest of exponent
  839. s.Take();
  840. }
  841. }
  842. }
  843. else { // positive exp
  844. int maxExp = 308 - expFrac;
  845. while (s.Peek() >= '0' && s.Peek() <= '9') {
  846. exp = exp * 10 + (s.Take() - '0');
  847. if (exp > maxExp)
  848. RAPIDJSON_PARSE_ERROR(kParseErrorNumberTooBig, s.Tell());
  849. }
  850. }
  851. }
  852. else
  853. RAPIDJSON_PARSE_ERROR(kParseErrorNumberMissExponent, s.Tell());
  854. if (expMinus)
  855. exp = -exp;
  856. }
  857. // Finish parsing, call event according to the type of number.
  858. bool cont = true;
  859. size_t length = s.Length();
  860. const char* decimal = s.Pop(); // Pop stack no matter if it will be used or not.
  861. if (useDouble) {
  862. int p = exp + expFrac;
  863. if (parseFlags & kParseFullPrecisionFlag)
  864. d = internal::StrtodFullPrecision(d, p, decimal, length, decimalPosition, exp);
  865. else
  866. d = internal::StrtodNormalPrecision(d, p);
  867. cont = handler.Double(minus ? -d : d);
  868. }
  869. else {
  870. if (use64bit) {
  871. if (minus)
  872. cont = handler.Int64(static_cast<int64_t>(~i64 + 1));
  873. else
  874. cont = handler.Uint64(i64);
  875. }
  876. else {
  877. if (minus)
  878. cont = handler.Int(static_cast<int32_t>(~i + 1));
  879. else
  880. cont = handler.Uint(i);
  881. }
  882. }
  883. if (!cont)
  884. RAPIDJSON_PARSE_ERROR(kParseErrorTermination, s.Tell());
  885. }
  886. // Parse any JSON value
  887. template<unsigned parseFlags, typename InputStream, typename Handler>
  888. void ParseValue(InputStream& is, Handler& handler) {
  889. switch (is.Peek()) {
  890. case 'n': ParseNull <parseFlags>(is, handler); break;
  891. case 't': ParseTrue <parseFlags>(is, handler); break;
  892. case 'f': ParseFalse <parseFlags>(is, handler); break;
  893. case '"': ParseString<parseFlags>(is, handler); break;
  894. case '{': ParseObject<parseFlags>(is, handler); break;
  895. case '[': ParseArray <parseFlags>(is, handler); break;
  896. default :
  897. ParseNumber<parseFlags>(is, handler);
  898. break;
  899. }
  900. }
  901. // Iterative Parsing
  902. // States
  903. enum IterativeParsingState {
  904. IterativeParsingStartState = 0,
  905. IterativeParsingFinishState,
  906. IterativeParsingErrorState,
  907. // Object states
  908. IterativeParsingObjectInitialState,
  909. IterativeParsingMemberKeyState,
  910. IterativeParsingKeyValueDelimiterState,
  911. IterativeParsingMemberValueState,
  912. IterativeParsingMemberDelimiterState,
  913. IterativeParsingObjectFinishState,
  914. // Array states
  915. IterativeParsingArrayInitialState,
  916. IterativeParsingElementState,
  917. IterativeParsingElementDelimiterState,
  918. IterativeParsingArrayFinishState,
  919. // Single value state
  920. IterativeParsingValueState,
  921. cIterativeParsingStateCount
  922. };
  923. // Tokens
  924. enum Token {
  925. LeftBracketToken = 0,
  926. RightBracketToken,
  927. LeftCurlyBracketToken,
  928. RightCurlyBracketToken,
  929. CommaToken,
  930. ColonToken,
  931. StringToken,
  932. FalseToken,
  933. TrueToken,
  934. NullToken,
  935. NumberToken,
  936. kTokenCount
  937. };
  938. RAPIDJSON_FORCEINLINE Token Tokenize(Ch c) {
  939. //!@cond RAPIDJSON_HIDDEN_FROM_DOXYGEN
  940. #define N NumberToken
  941. #define N16 N,N,N,N,N,N,N,N,N,N,N,N,N,N,N,N
  942. // Maps from ASCII to Token
  943. static const unsigned char tokenMap[256] = {
  944. N16, // 00~0F
  945. N16, // 10~1F
  946. N, N, StringToken, N, N, N, N, N, N, N, N, N, CommaToken, N, N, N, // 20~2F
  947. N, N, N, N, N, N, N, N, N, N, ColonToken, N, N, N, N, N, // 30~3F
  948. N16, // 40~4F
  949. N, N, N, N, N, N, N, N, N, N, N, LeftBracketToken, N, RightBracketToken, N, N, // 50~5F
  950. N, N, N, N, N, N, FalseToken, N, N, N, N, N, N, N, NullToken, N, // 60~6F
  951. N, N, N, N, TrueToken, N, N, N, N, N, N, LeftCurlyBracketToken, N, RightCurlyBracketToken, N, N, // 70~7F
  952. N16, N16, N16, N16, N16, N16, N16, N16 // 80~FF
  953. };
  954. #undef N
  955. #undef N16
  956. //!@endcond
  957. if (sizeof(Ch) == 1 || unsigned(c) < 256)
  958. return (Token)tokenMap[(unsigned char)c];
  959. else
  960. return NumberToken;
  961. }
  962. RAPIDJSON_FORCEINLINE IterativeParsingState Predict(IterativeParsingState state, Token token) {
  963. // current state x one lookahead token -> new state
  964. static const char G[cIterativeParsingStateCount][kTokenCount] = {
  965. // Start
  966. {
  967. IterativeParsingArrayInitialState, // Left bracket
  968. IterativeParsingErrorState, // Right bracket
  969. IterativeParsingObjectInitialState, // Left curly bracket
  970. IterativeParsingErrorState, // Right curly bracket
  971. IterativeParsingErrorState, // Comma
  972. IterativeParsingErrorState, // Colon
  973. IterativeParsingValueState, // String
  974. IterativeParsingValueState, // False
  975. IterativeParsingValueState, // True
  976. IterativeParsingValueState, // Null
  977. IterativeParsingValueState // Number
  978. },
  979. // Finish(sink state)
  980. {
  981. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  982. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  983. IterativeParsingErrorState
  984. },
  985. // Error(sink state)
  986. {
  987. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  988. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  989. IterativeParsingErrorState
  990. },
  991. // ObjectInitial
  992. {
  993. IterativeParsingErrorState, // Left bracket
  994. IterativeParsingErrorState, // Right bracket
  995. IterativeParsingErrorState, // Left curly bracket
  996. IterativeParsingObjectFinishState, // Right curly bracket
  997. IterativeParsingErrorState, // Comma
  998. IterativeParsingErrorState, // Colon
  999. IterativeParsingMemberKeyState, // String
  1000. IterativeParsingErrorState, // False
  1001. IterativeParsingErrorState, // True
  1002. IterativeParsingErrorState, // Null
  1003. IterativeParsingErrorState // Number
  1004. },
  1005. // MemberKey
  1006. {
  1007. IterativeParsingErrorState, // Left bracket
  1008. IterativeParsingErrorState, // Right bracket
  1009. IterativeParsingErrorState, // Left curly bracket
  1010. IterativeParsingErrorState, // Right curly bracket
  1011. IterativeParsingErrorState, // Comma
  1012. IterativeParsingKeyValueDelimiterState, // Colon
  1013. IterativeParsingErrorState, // String
  1014. IterativeParsingErrorState, // False
  1015. IterativeParsingErrorState, // True
  1016. IterativeParsingErrorState, // Null
  1017. IterativeParsingErrorState // Number
  1018. },
  1019. // KeyValueDelimiter
  1020. {
  1021. IterativeParsingArrayInitialState, // Left bracket(push MemberValue state)
  1022. IterativeParsingErrorState, // Right bracket
  1023. IterativeParsingObjectInitialState, // Left curly bracket(push MemberValue state)
  1024. IterativeParsingErrorState, // Right curly bracket
  1025. IterativeParsingErrorState, // Comma
  1026. IterativeParsingErrorState, // Colon
  1027. IterativeParsingMemberValueState, // String
  1028. IterativeParsingMemberValueState, // False
  1029. IterativeParsingMemberValueState, // True
  1030. IterativeParsingMemberValueState, // Null
  1031. IterativeParsingMemberValueState // Number
  1032. },
  1033. // MemberValue
  1034. {
  1035. IterativeParsingErrorState, // Left bracket
  1036. IterativeParsingErrorState, // Right bracket
  1037. IterativeParsingErrorState, // Left curly bracket
  1038. IterativeParsingObjectFinishState, // Right curly bracket
  1039. IterativeParsingMemberDelimiterState, // Comma
  1040. IterativeParsingErrorState, // Colon
  1041. IterativeParsingErrorState, // String
  1042. IterativeParsingErrorState, // False
  1043. IterativeParsingErrorState, // True
  1044. IterativeParsingErrorState, // Null
  1045. IterativeParsingErrorState // Number
  1046. },
  1047. // MemberDelimiter
  1048. {
  1049. IterativeParsingErrorState, // Left bracket
  1050. IterativeParsingErrorState, // Right bracket
  1051. IterativeParsingErrorState, // Left curly bracket
  1052. IterativeParsingErrorState, // Right curly bracket
  1053. IterativeParsingErrorState, // Comma
  1054. IterativeParsingErrorState, // Colon
  1055. IterativeParsingMemberKeyState, // String
  1056. IterativeParsingErrorState, // False
  1057. IterativeParsingErrorState, // True
  1058. IterativeParsingErrorState, // Null
  1059. IterativeParsingErrorState // Number
  1060. },
  1061. // ObjectFinish(sink state)
  1062. {
  1063. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1064. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1065. IterativeParsingErrorState
  1066. },
  1067. // ArrayInitial
  1068. {
  1069. IterativeParsingArrayInitialState, // Left bracket(push Element state)
  1070. IterativeParsingArrayFinishState, // Right bracket
  1071. IterativeParsingObjectInitialState, // Left curly bracket(push Element state)
  1072. IterativeParsingErrorState, // Right curly bracket
  1073. IterativeParsingErrorState, // Comma
  1074. IterativeParsingErrorState, // Colon
  1075. IterativeParsingElementState, // String
  1076. IterativeParsingElementState, // False
  1077. IterativeParsingElementState, // True
  1078. IterativeParsingElementState, // Null
  1079. IterativeParsingElementState // Number
  1080. },
  1081. // Element
  1082. {
  1083. IterativeParsingErrorState, // Left bracket
  1084. IterativeParsingArrayFinishState, // Right bracket
  1085. IterativeParsingErrorState, // Left curly bracket
  1086. IterativeParsingErrorState, // Right curly bracket
  1087. IterativeParsingElementDelimiterState, // Comma
  1088. IterativeParsingErrorState, // Colon
  1089. IterativeParsingErrorState, // String
  1090. IterativeParsingErrorState, // False
  1091. IterativeParsingErrorState, // True
  1092. IterativeParsingErrorState, // Null
  1093. IterativeParsingErrorState // Number
  1094. },
  1095. // ElementDelimiter
  1096. {
  1097. IterativeParsingArrayInitialState, // Left bracket(push Element state)
  1098. IterativeParsingErrorState, // Right bracket
  1099. IterativeParsingObjectInitialState, // Left curly bracket(push Element state)
  1100. IterativeParsingErrorState, // Right curly bracket
  1101. IterativeParsingErrorState, // Comma
  1102. IterativeParsingErrorState, // Colon
  1103. IterativeParsingElementState, // String
  1104. IterativeParsingElementState, // False
  1105. IterativeParsingElementState, // True
  1106. IterativeParsingElementState, // Null
  1107. IterativeParsingElementState // Number
  1108. },
  1109. // ArrayFinish(sink state)
  1110. {
  1111. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1112. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1113. IterativeParsingErrorState
  1114. },
  1115. // Single Value (sink state)
  1116. {
  1117. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1118. IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState, IterativeParsingErrorState,
  1119. IterativeParsingErrorState
  1120. }
  1121. }; // End of G
  1122. return (IterativeParsingState)G[state][token];
  1123. }
  1124. // Make an advance in the token stream and state based on the candidate destination state which was returned by Transit().
  1125. // May return a new state on state pop.
  1126. template <unsigned parseFlags, typename InputStream, typename Handler>
  1127. RAPIDJSON_FORCEINLINE IterativeParsingState Transit(IterativeParsingState src, Token token, IterativeParsingState dst, InputStream& is, Handler& handler) {
  1128. (void)token;
  1129. switch (dst) {
  1130. case IterativeParsingErrorState:
  1131. return dst;
  1132. case IterativeParsingObjectInitialState:
  1133. case IterativeParsingArrayInitialState:
  1134. {
  1135. // Push the state(Element or MemeberValue) if we are nested in another array or value of member.
  1136. // In this way we can get the correct state on ObjectFinish or ArrayFinish by frame pop.
  1137. IterativeParsingState n = src;
  1138. if (src == IterativeParsingArrayInitialState || src == IterativeParsingElementDelimiterState)
  1139. n = IterativeParsingElementState;
  1140. else if (src == IterativeParsingKeyValueDelimiterState)
  1141. n = IterativeParsingMemberValueState;
  1142. // Push current state.
  1143. *stack_.template Push<SizeType>(1) = n;
  1144. // Initialize and push the member/element count.
  1145. *stack_.template Push<SizeType>(1) = 0;
  1146. // Call handler
  1147. bool hr = (dst == IterativeParsingObjectInitialState) ? handler.StartObject() : handler.StartArray();
  1148. // On handler short circuits the parsing.
  1149. if (!hr) {
  1150. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorTermination, is.Tell());
  1151. return IterativeParsingErrorState;
  1152. }
  1153. else {
  1154. is.Take();
  1155. return dst;
  1156. }
  1157. }
  1158. case IterativeParsingMemberKeyState:
  1159. ParseString<parseFlags>(is, handler, true);
  1160. if (HasParseError())
  1161. return IterativeParsingErrorState;
  1162. else
  1163. return dst;
  1164. case IterativeParsingKeyValueDelimiterState:
  1165. RAPIDJSON_ASSERT(token == ColonToken);
  1166. is.Take();
  1167. return dst;
  1168. case IterativeParsingMemberValueState:
  1169. // Must be non-compound value. Or it would be ObjectInitial or ArrayInitial state.
  1170. ParseValue<parseFlags>(is, handler);
  1171. if (HasParseError()) {
  1172. return IterativeParsingErrorState;
  1173. }
  1174. return dst;
  1175. case IterativeParsingElementState:
  1176. // Must be non-compound value. Or it would be ObjectInitial or ArrayInitial state.
  1177. ParseValue<parseFlags>(is, handler);
  1178. if (HasParseError()) {
  1179. return IterativeParsingErrorState;
  1180. }
  1181. return dst;
  1182. case IterativeParsingMemberDelimiterState:
  1183. case IterativeParsingElementDelimiterState:
  1184. is.Take();
  1185. // Update member/element count.
  1186. *stack_.template Top<SizeType>() = *stack_.template Top<SizeType>() + 1;
  1187. return dst;
  1188. case IterativeParsingObjectFinishState:
  1189. {
  1190. // Get member count.
  1191. SizeType c = *stack_.template Pop<SizeType>(1);
  1192. // If the object is not empty, count the last member.
  1193. if (src == IterativeParsingMemberValueState)
  1194. ++c;
  1195. // Restore the state.
  1196. IterativeParsingState n = static_cast<IterativeParsingState>(*stack_.template Pop<SizeType>(1));
  1197. // Transit to Finish state if this is the topmost scope.
  1198. if (n == IterativeParsingStartState)
  1199. n = IterativeParsingFinishState;
  1200. // Call handler
  1201. bool hr = handler.EndObject(c);
  1202. // On handler short circuits the parsing.
  1203. if (!hr) {
  1204. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorTermination, is.Tell());
  1205. return IterativeParsingErrorState;
  1206. }
  1207. else {
  1208. is.Take();
  1209. return n;
  1210. }
  1211. }
  1212. case IterativeParsingArrayFinishState:
  1213. {
  1214. // Get element count.
  1215. SizeType c = *stack_.template Pop<SizeType>(1);
  1216. // If the array is not empty, count the last element.
  1217. if (src == IterativeParsingElementState)
  1218. ++c;
  1219. // Restore the state.
  1220. IterativeParsingState n = static_cast<IterativeParsingState>(*stack_.template Pop<SizeType>(1));
  1221. // Transit to Finish state if this is the topmost scope.
  1222. if (n == IterativeParsingStartState)
  1223. n = IterativeParsingFinishState;
  1224. // Call handler
  1225. bool hr = handler.EndArray(c);
  1226. // On handler short circuits the parsing.
  1227. if (!hr) {
  1228. RAPIDJSON_PARSE_ERROR_NORETURN(kParseErrorTermination, is.Tell());
  1229. return IterativeParsingErrorState;
  1230. }
  1231. else {
  1232. is.Take();
  1233. return n;
  1234. }
  1235. }
  1236. default:
  1237. // This branch is for IterativeParsingValueState actually.
  1238. // Use `default:` rather than
  1239. // `case IterativeParsingValueState:` is for code coverage.
  1240. // The IterativeParsingStartState is not enumerated in this switch-case.
  1241. // It is impossible for that case. And it can be caught by following assertion.
  1242. // The IterativeParsingFinishState is not enumerated in this switch-case either.
  1243. // It is a "derivative" state which cannot triggered from Predict() directly.
  1244. // Therefore it cannot happen here. And it can be caught by following assertion.
  1245. RAPIDJSON_ASSERT(dst == IterativeParsingValueState);
  1246. // Must be non-compound value. Or it would be ObjectInitial or ArrayInitial state.
  1247. ParseValue<parseFlags>(is, handler);
  1248. if (HasParseError()) {
  1249. return IterativeParsingErrorState;
  1250. }
  1251. return IterativeParsingFinishState;
  1252. }
  1253. }
  1254. template <typename InputStream>
  1255. void HandleError(IterativeParsingState src, InputStream& is) {
  1256. if (HasParseError()) {
  1257. // Error flag has been set.
  1258. return;
  1259. }
  1260. switch (src) {
  1261. case IterativeParsingStartState: RAPIDJSON_PARSE_ERROR(kParseErrorDocumentEmpty, is.Tell()); return;
  1262. case IterativeParsingFinishState: RAPIDJSON_PARSE_ERROR(kParseErrorDocumentRootNotSingular, is.Tell()); return;
  1263. case IterativeParsingObjectInitialState:
  1264. case IterativeParsingMemberDelimiterState: RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissName, is.Tell()); return;
  1265. case IterativeParsingMemberKeyState: RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissColon, is.Tell()); return;
  1266. case IterativeParsingMemberValueState: RAPIDJSON_PARSE_ERROR(kParseErrorObjectMissCommaOrCurlyBracket, is.Tell()); return;
  1267. case IterativeParsingElementState: RAPIDJSON_PARSE_ERROR(kParseErrorArrayMissCommaOrSquareBracket, is.Tell()); return;
  1268. default: RAPIDJSON_PARSE_ERROR(kParseErrorUnspecificSyntaxError, is.Tell()); return;
  1269. }
  1270. }
  1271. template <unsigned parseFlags, typename InputStream, typename Handler>
  1272. ParseResult IterativeParse(InputStream& is, Handler& handler) {
  1273. parseResult_.Clear();
  1274. ClearStackOnExit scope(*this);
  1275. IterativeParsingState state = IterativeParsingStartState;
  1276. SkipWhitespaceAndComments<parseFlags>(is);
  1277. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  1278. while (is.Peek() != '\0') {
  1279. Token t = Tokenize(is.Peek());
  1280. IterativeParsingState n = Predict(state, t);
  1281. IterativeParsingState d = Transit<parseFlags>(state, t, n, is, handler);
  1282. if (d == IterativeParsingErrorState) {
  1283. HandleError(state, is);
  1284. break;
  1285. }
  1286. state = d;
  1287. // Do not further consume streams if a root JSON has been parsed.
  1288. if ((parseFlags & kParseStopWhenDoneFlag) && state == IterativeParsingFinishState)
  1289. break;
  1290. SkipWhitespaceAndComments<parseFlags>(is);
  1291. RAPIDJSON_PARSE_ERROR_EARLY_RETURN(parseResult_);
  1292. }
  1293. // Handle the end of file.
  1294. if (state != IterativeParsingFinishState)
  1295. HandleError(state, is);
  1296. return parseResult_;
  1297. }
  1298. static const size_t kDefaultStackCapacity = 256; //!< Default stack capacity in bytes for storing a single decoded string.
  1299. internal::Stack<StackAllocator> stack_; //!< A stack for storing decoded string temporarily during non-destructive parsing.
  1300. ParseResult parseResult_;
  1301. }; // class GenericReader
  1302. //! Reader with UTF8 encoding and default allocator.
  1303. typedef GenericReader<UTF8<>, UTF8<> > Reader;
  1304. RAPIDJSON_NAMESPACE_END
  1305. #ifdef __GNUC__
  1306. RAPIDJSON_DIAG_POP
  1307. #endif
  1308. #ifdef _MSC_VER
  1309. RAPIDJSON_DIAG_POP
  1310. #endif
  1311. #endif // RAPIDJSON_READER_H_