Fix JSON parser issue when parsing from streams whose string literals contain escaped characters.

stgates · stgates · commit 9fcc601ce6a0 · 2015-04-02T20:13:29.000-07:00
diff --git a/Release/src/json/json_parsing.cpp b/Release/src/json/json_parsing.cpp
@@ -716,6 +716,8 @@ void convert_append_unicode_code_unit(JSON_Parser<char>::Token &token, utf16char
 template <typename CharType>
 inline bool JSON_Parser<CharType>::handle_unescape_char(Token &token)
 {
+    token.has_unescape_symbol = true;
+
     // This function converts unescaped character pairs (e.g. "\t") into their ASCII or Unicode representations (e.g. tab sign)
     // Also it handles \u + 4 hexadecimal digits
     auto ch = NextCharacter();
@@ -784,6 +786,7 @@ inline bool JSON_Parser<CharType>::handle_unescape_char(Token &token)
 template <typename CharType>
 bool JSON_Parser<CharType>::CompleteStringLiteral(Token &token)
 {
+    token.has_unescape_symbol = false;
     auto ch = NextCharacter();
     while ( ch != '"' )
     {
@@ -836,13 +839,18 @@ bool JSON_StringParser<CharType>::CompleteStringLiteral(typename JSON_Parser<Cha
 
         if (ch == '\\')
         {
-            token.string_val.resize(m_position - start - 1);
-            if (token.string_val.size() > 0)
-                memcpy(&token.string_val[0], start, (m_position - start - 1)*sizeof(CharType));
+            const size_t numChars = m_position - start - 1;
+            const size_t prevSize = token.string_val.size();
+            token.string_val.resize(prevSize + numChars);
+            memcpy(const_cast<CharType *>(token.string_val.c_str() + prevSize), start, numChars * sizeof(CharType));
 
-            token.has_unescape_symbol = true;
+            if (!JSON_StringParser<CharType>::handle_unescape_char(token))
+            {
+                return false;
+            }
 
-            return finish_parsing_string_with_unescape_char(token);
+            // Reset start position and continue.
+            start = m_position;
         }
         else if (ch >= CharType(0x0) && ch < CharType(0x20))
         {
@@ -852,47 +860,16 @@ bool JSON_StringParser<CharType>::CompleteStringLiteral(typename JSON_Parser<Cha
         ch = JSON_StringParser<CharType>::NextCharacter();
     }
 
-    token.string_val.resize(m_position - start - 1);
-    if (token.string_val.size() > 0)
-        memcpy(&token.string_val[0], start, (m_position - start - 1)*sizeof(CharType));
+    const size_t numChars = m_position - start - 1;
+    const size_t prevSize = token.string_val.size();
+    token.string_val.resize(prevSize + numChars);
+    memcpy(const_cast<CharType *>(token.string_val.c_str() + prevSize), start, numChars * sizeof(CharType));
 
     token.kind = JSON_Parser<CharType>::Token::TKN_StringLiteral;
 
     return true;
 }
 
-template <typename CharType>
-bool JSON_StringParser<CharType>::finish_parsing_string_with_unescape_char(typename JSON_Parser<CharType>::Token &token)
-{
-    // This function handles parsing the string when an unescape character is encountered.
-    // It is called once the part before the unescape char is copied to the token.string_val string
-
-    typename JSON_Parser<CharType>::int_type ch;
-
-    if (!JSON_StringParser<CharType>::handle_unescape_char(token))
-        return false;
-
-    while ((ch = JSON_StringParser<CharType>::NextCharacter()) != '"')
-    {
-        if (ch == '\\')
-        {
-            if (!JSON_StringParser<CharType>::handle_unescape_char(token))
-                return false;
-        }
-        else
-        {
-            if (ch == eof<CharType>())
-                return false;
-
-            token.string_val.push_back(static_cast<CharType>(ch));
-        }
-    }
-
-    token.kind = JSON_StringParser<CharType>::Token::TKN_StringLiteral;
-
-    return true;
-}
-
 template <typename CharType>
 void JSON_Parser<CharType>::GetNextToken(typename JSON_Parser<CharType>::Token& result)
 {
diff --git a/Release/tests/functional/json/parsing_tests.cpp b/Release/tests/functional/json/parsing_tests.cpp
@@ -278,6 +278,10 @@ TEST(escaping_control_characters)
         const auto &v = json::value::parse(str);
         VERIFY_IS_TRUE(v.is_string());
         VERIFY_ARE_EQUAL(expectedStr, v.serialize());
+
+        // Try parsing a stringstream.
+        const auto &ssv = json::value::parse(ss);
+        VERIFY_ARE_EQUAL(expectedStr, ssv.serialize());
     }
 }
 

Original file line number	Diff line number	Diff line change
`@@ -278,6 +278,10 @@ TEST(escaping_control_characters)`
`278`	`278`	`const auto &v = json::value::parse(str);`
`279`	`279`	`VERIFY_IS_TRUE(v.is_string());`
`280`	`280`	`VERIFY_ARE_EQUAL(expectedStr, v.serialize());`
	`281`	`+`
	`282`	`+ // Try parsing a stringstream.`
	`283`	`+ const auto &ssv = json::value::parse(ss);`
	`284`	`+ VERIFY_ARE_EQUAL(expectedStr, ssv.serialize());`
`281`	`285`	`}`
`282`	`286`	`}`
`283`	`287`