You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
190 lines
5.6 KiB
190 lines
5.6 KiB
// Copyright (c) 2013 The Chromium Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
#include "base/json/string_escape.h"
|
|
|
|
#include <stddef.h>
|
|
|
|
#include "base/macros.h"
|
|
#include "base/strings/string_util.h"
|
|
#include "base/strings/utf_string_conversions.h"
|
|
#include "testing/gtest/include/gtest/gtest.h"
|
|
|
|
namespace base {
|
|
|
|
TEST(JSONStringEscapeTest, EscapeUTF8) {
|
|
const struct {
|
|
const char* to_escape;
|
|
const char* escaped;
|
|
} cases[] = {
|
|
{"\b\001aZ\"\\wee", "\\b\\u0001aZ\\\"\\\\wee"},
|
|
{"a\b\f\n\r\t\v\1\\.\"z", "a\\b\\f\\n\\r\\t\\u000B\\u0001\\\\.\\\"z"},
|
|
{"b\x0f\x7f\xf0\xff!", // \xf0\xff is not a valid UTF-8 unit.
|
|
"b\\u000F\x7F\xEF\xBF\xBD\xEF\xBF\xBD!"},
|
|
{"c<>d", "c\\u003C>d"},
|
|
{"Hello\xe2\x80\xa8world", "Hello\\u2028world"},
|
|
{"\xe2\x80\xa9purple", "\\u2029purple"},
|
|
{"\xF3\xBF\xBF\xBF", "\xEF\xBF\xBD"},
|
|
};
|
|
|
|
for (size_t i = 0; i < arraysize(cases); ++i) {
|
|
const char* in_ptr = cases[i].to_escape;
|
|
std::string in_str = in_ptr;
|
|
|
|
std::string out;
|
|
EscapeJSONString(in_ptr, false, &out);
|
|
EXPECT_EQ(std::string(cases[i].escaped), out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
out.erase();
|
|
bool convert_ok = EscapeJSONString(in_str, false, &out);
|
|
EXPECT_EQ(std::string(cases[i].escaped), out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
if (convert_ok) {
|
|
std::string fooout = GetQuotedJSONString(in_str);
|
|
EXPECT_EQ("\"" + std::string(cases[i].escaped) + "\"", fooout);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
}
|
|
}
|
|
|
|
std::string in = cases[0].to_escape;
|
|
std::string out;
|
|
EscapeJSONString(in, false, &out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
// test quoting
|
|
std::string out_quoted;
|
|
EscapeJSONString(in, true, &out_quoted);
|
|
EXPECT_EQ(out.length() + 2, out_quoted.length());
|
|
EXPECT_EQ(out_quoted.find(out), 1U);
|
|
EXPECT_TRUE(IsStringUTF8(out_quoted));
|
|
|
|
// now try with a NULL in the string
|
|
std::string null_prepend = "test";
|
|
null_prepend.push_back(0);
|
|
in = null_prepend + in;
|
|
std::string expected = "test\\u0000";
|
|
expected += cases[0].escaped;
|
|
out.clear();
|
|
EscapeJSONString(in, false, &out);
|
|
EXPECT_EQ(expected, out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
}
|
|
|
|
TEST(JSONStringEscapeTest, EscapeUTF16) {
|
|
const struct {
|
|
const wchar_t* to_escape;
|
|
const char* escaped;
|
|
} cases[] = {
|
|
{L"b\uffb1\u00ff", "b\xEF\xBE\xB1\xC3\xBF"},
|
|
{L"\b\001aZ\"\\wee", "\\b\\u0001aZ\\\"\\\\wee"},
|
|
{L"a\b\f\n\r\t\v\1\\.\"z",
|
|
"a\\b\\f\\n\\r\\t\\u000B\\u0001\\\\.\\\"z"},
|
|
{L"b\x0f\x7f\xf0\xff!", "b\\u000F\x7F\xC3\xB0\xC3\xBF!"},
|
|
{L"c<>d", "c\\u003C>d"},
|
|
{L"Hello\u2028world", "Hello\\u2028world"},
|
|
{L"\u2029purple", "\\u2029purple"},
|
|
};
|
|
|
|
for (size_t i = 0; i < arraysize(cases); ++i) {
|
|
string16 in = WideToUTF16(cases[i].to_escape);
|
|
|
|
std::string out;
|
|
EscapeJSONString(in, false, &out);
|
|
EXPECT_EQ(std::string(cases[i].escaped), out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
out = GetQuotedJSONString(in);
|
|
EXPECT_EQ("\"" + std::string(cases[i].escaped) + "\"", out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
}
|
|
|
|
string16 in = WideToUTF16(cases[0].to_escape);
|
|
std::string out;
|
|
EscapeJSONString(in, false, &out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
// test quoting
|
|
std::string out_quoted;
|
|
EscapeJSONString(in, true, &out_quoted);
|
|
EXPECT_EQ(out.length() + 2, out_quoted.length());
|
|
EXPECT_EQ(out_quoted.find(out), 1U);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
|
|
// now try with a NULL in the string
|
|
string16 null_prepend = WideToUTF16(L"test");
|
|
null_prepend.push_back(0);
|
|
in = null_prepend + in;
|
|
std::string expected = "test\\u0000";
|
|
expected += cases[0].escaped;
|
|
out.clear();
|
|
EscapeJSONString(in, false, &out);
|
|
EXPECT_EQ(expected, out);
|
|
EXPECT_TRUE(IsStringUTF8(out));
|
|
}
|
|
|
|
TEST(JSONStringEscapeTest, EscapeUTF16OutsideBMP) {
|
|
{
|
|
// {a, U+10300, !}, SMP.
|
|
string16 test;
|
|
test.push_back('a');
|
|
test.push_back(0xD800);
|
|
test.push_back(0xDF00);
|
|
test.push_back('!');
|
|
std::string actual;
|
|
EXPECT_TRUE(EscapeJSONString(test, false, &actual));
|
|
EXPECT_EQ("a\xF0\x90\x8C\x80!", actual);
|
|
}
|
|
{
|
|
// {U+20021, U+2002B}, SIP.
|
|
string16 test;
|
|
test.push_back(0xD840);
|
|
test.push_back(0xDC21);
|
|
test.push_back(0xD840);
|
|
test.push_back(0xDC2B);
|
|
std::string actual;
|
|
EXPECT_TRUE(EscapeJSONString(test, false, &actual));
|
|
EXPECT_EQ("\xF0\xA0\x80\xA1\xF0\xA0\x80\xAB", actual);
|
|
}
|
|
{
|
|
// {?, U+D800, @}, lone surrogate.
|
|
string16 test;
|
|
test.push_back('?');
|
|
test.push_back(0xD800);
|
|
test.push_back('@');
|
|
std::string actual;
|
|
EXPECT_FALSE(EscapeJSONString(test, false, &actual));
|
|
EXPECT_EQ("?\xEF\xBF\xBD@", actual);
|
|
}
|
|
}
|
|
|
|
TEST(JSONStringEscapeTest, EscapeBytes) {
|
|
const struct {
|
|
const char* to_escape;
|
|
const char* escaped;
|
|
} cases[] = {
|
|
{"b\x0f\x7f\xf0\xff!", "b\\u000F\\u007F\\u00F0\\u00FF!"},
|
|
{"\xe5\xc4\x4f\x05\xb6\xfd", "\\u00E5\\u00C4O\\u0005\\u00B6\\u00FD"},
|
|
};
|
|
|
|
for (size_t i = 0; i < arraysize(cases); ++i) {
|
|
std::string in = std::string(cases[i].to_escape);
|
|
EXPECT_FALSE(IsStringUTF8(in));
|
|
|
|
EXPECT_EQ(std::string(cases[i].escaped),
|
|
EscapeBytesAsInvalidJSONString(in, false));
|
|
EXPECT_EQ("\"" + std::string(cases[i].escaped) + "\"",
|
|
EscapeBytesAsInvalidJSONString(in, true));
|
|
}
|
|
|
|
const char kEmbedNull[] = { '\xab', '\x39', '\0', '\x9f', '\xab' };
|
|
std::string in(kEmbedNull, arraysize(kEmbedNull));
|
|
EXPECT_FALSE(IsStringUTF8(in));
|
|
EXPECT_EQ(std::string("\\u00AB9\\u0000\\u009F\\u00AB"),
|
|
EscapeBytesAsInvalidJSONString(in, false));
|
|
}
|
|
|
|
} // namespace base
|