| //===-- JSONTest.cpp - JSON unit tests --------------------------*- C++ -*-===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "llvm/Support/JSON.h" |
| |
| #include "gmock/gmock.h" |
| #include "gtest/gtest.h" |
| |
| namespace llvm { |
| namespace json { |
| |
| namespace { |
| |
| std::string s(const Value &E) { return llvm::formatv("{0}", E).str(); } |
| std::string sp(const Value &E) { return llvm::formatv("{0:2}", E).str(); } |
| |
| TEST(JSONTest, Types) { |
| EXPECT_EQ("true", s(true)); |
| EXPECT_EQ("null", s(nullptr)); |
| EXPECT_EQ("2.5", s(2.5)); |
| EXPECT_EQ(R"("foo")", s("foo")); |
| EXPECT_EQ("[1,2,3]", s({1, 2, 3})); |
| EXPECT_EQ(R"({"x":10,"y":20})", s(Object{{"x", 10}, {"y", 20}})); |
| |
| #ifdef NDEBUG |
| EXPECT_EQ(R"("��")", s("\xC0\x80")); |
| EXPECT_EQ(R"({"��":0})", s(Object{{"\xC0\x80", 0}})); |
| #else |
| EXPECT_DEATH(s("\xC0\x80"), "Invalid UTF-8"); |
| EXPECT_DEATH(s(Object{{"\xC0\x80", 0}}), "Invalid UTF-8"); |
| #endif |
| } |
| |
| TEST(JSONTest, Constructors) { |
| // Lots of edge cases around empty and singleton init lists. |
| EXPECT_EQ("[[[3]]]", s({{{3}}})); |
| EXPECT_EQ("[[[]]]", s({{{}}})); |
| EXPECT_EQ("[[{}]]", s({{Object{}}})); |
| EXPECT_EQ(R"({"A":{"B":{}}})", s(Object{{"A", Object{{"B", Object{}}}}})); |
| EXPECT_EQ(R"({"A":{"B":{"X":"Y"}}})", |
| s(Object{{"A", Object{{"B", Object{{"X", "Y"}}}}}})); |
| EXPECT_EQ("null", s(llvm::Optional<double>())); |
| EXPECT_EQ("2.5", s(llvm::Optional<double>(2.5))); |
| } |
| |
| TEST(JSONTest, StringOwnership) { |
| char X[] = "Hello"; |
| Value Alias = static_cast<const char *>(X); |
| X[1] = 'a'; |
| EXPECT_EQ(R"("Hallo")", s(Alias)); |
| |
| std::string Y = "Hello"; |
| Value Copy = Y; |
| Y[1] = 'a'; |
| EXPECT_EQ(R"("Hello")", s(Copy)); |
| } |
| |
| TEST(JSONTest, CanonicalOutput) { |
| // Objects are sorted (but arrays aren't)! |
| EXPECT_EQ(R"({"a":1,"b":2,"c":3})", s(Object{{"a", 1}, {"c", 3}, {"b", 2}})); |
| EXPECT_EQ(R"(["a","c","b"])", s({"a", "c", "b"})); |
| EXPECT_EQ("3", s(3.0)); |
| } |
| |
| TEST(JSONTest, Escaping) { |
| std::string test = { |
| 0, // Strings may contain nulls. |
| '\b', '\f', // Have mnemonics, but we escape numerically. |
| '\r', '\n', '\t', // Escaped with mnemonics. |
| 'S', '\"', '\\', // Printable ASCII characters. |
| '\x7f', // Delete is not escaped. |
| '\xce', '\x94', // Non-ASCII UTF-8 is not escaped. |
| }; |
| |
| std::string teststring = R"("\u0000\u0008\u000c\r\n\tS\"\\)" |
| "\x7f\xCE\x94\""; |
| |
| EXPECT_EQ(teststring, s(test)); |
| |
| EXPECT_EQ(R"({"object keys are\nescaped":true})", |
| s(Object{{"object keys are\nescaped", true}})); |
| } |
| |
| TEST(JSONTest, PrettyPrinting) { |
| const char str[] = R"({ |
| "empty_array": [], |
| "empty_object": {}, |
| "full_array": [ |
| 1, |
| null |
| ], |
| "full_object": { |
| "nested_array": [ |
| { |
| "property": "value" |
| } |
| ] |
| } |
| })"; |
| |
| EXPECT_EQ(str, sp(Object{ |
| {"empty_object", Object{}}, |
| {"empty_array", {}}, |
| {"full_array", {1, nullptr}}, |
| {"full_object", |
| Object{ |
| {"nested_array", |
| {Object{ |
| {"property", "value"}, |
| }}}, |
| }}, |
| })); |
| } |
| |
| TEST(JSONTest, Parse) { |
| auto Compare = [](llvm::StringRef S, Value Expected) { |
| if (auto E = parse(S)) { |
| // Compare both string forms and with operator==, in case we have bugs. |
| EXPECT_EQ(*E, Expected); |
| EXPECT_EQ(sp(*E), sp(Expected)); |
| } else { |
| handleAllErrors(E.takeError(), [S](const llvm::ErrorInfoBase &E) { |
| FAIL() << "Failed to parse JSON >>> " << S << " <<<: " << E.message(); |
| }); |
| } |
| }; |
| |
| Compare(R"(true)", true); |
| Compare(R"(false)", false); |
| Compare(R"(null)", nullptr); |
| |
| Compare(R"(42)", 42); |
| Compare(R"(2.5)", 2.5); |
| Compare(R"(2e50)", 2e50); |
| Compare(R"(1.2e3456789)", std::numeric_limits<double>::infinity()); |
| |
| Compare(R"("foo")", "foo"); |
| Compare(R"("\"\\\b\f\n\r\t")", "\"\\\b\f\n\r\t"); |
| Compare(R"("\u0000")", llvm::StringRef("\0", 1)); |
| Compare("\"\x7f\"", "\x7f"); |
| Compare(R"("\ud801\udc37")", u8"\U00010437"); // UTF16 surrogate pair escape. |
| Compare("\"\xE2\x82\xAC\xF0\x9D\x84\x9E\"", u8"\u20ac\U0001d11e"); // UTF8 |
| Compare( |
| R"("LoneLeading=\ud801, LoneTrailing=\udc01, LeadingLeadingTrailing=\ud801\ud801\udc37")", |
| u8"LoneLeading=\ufffd, LoneTrailing=\ufffd, " |
| u8"LeadingLeadingTrailing=\ufffd\U00010437"); // Invalid unicode. |
| |
| Compare(R"({"":0,"":0})", Object{{"", 0}}); |
| Compare(R"({"obj":{},"arr":[]})", Object{{"obj", Object{}}, {"arr", {}}}); |
| Compare(R"({"\n":{"\u0000":[[[[]]]]}})", |
| Object{{"\n", Object{ |
| {llvm::StringRef("\0", 1), {{{{}}}}}, |
| }}}); |
| Compare("\r[\n\t] ", {}); |
| } |
| |
| TEST(JSONTest, ParseErrors) { |
| auto ExpectErr = [](llvm::StringRef Msg, llvm::StringRef S) { |
| if (auto E = parse(S)) { |
| // Compare both string forms and with operator==, in case we have bugs. |
| FAIL() << "Parsed JSON >>> " << S << " <<< but wanted error: " << Msg; |
| } else { |
| handleAllErrors(E.takeError(), [S, Msg](const llvm::ErrorInfoBase &E) { |
| EXPECT_THAT(E.message(), testing::HasSubstr(Msg)) << S; |
| }); |
| } |
| }; |
| ExpectErr("Unexpected EOF", ""); |
| ExpectErr("Unexpected EOF", "["); |
| ExpectErr("Text after end of document", "[][]"); |
| ExpectErr("Invalid JSON value (false?)", "fuzzy"); |
| ExpectErr("Expected , or ]", "[2?]"); |
| ExpectErr("Expected object key", "{a:2}"); |
| ExpectErr("Expected : after object key", R"({"a",2})"); |
| ExpectErr("Expected , or } after object property", R"({"a":2 "b":3})"); |
| ExpectErr("Invalid JSON value", R"([&%!])"); |
| ExpectErr("Invalid JSON value (number?)", "1e1.0"); |
| ExpectErr("Unterminated string", R"("abc\"def)"); |
| ExpectErr("Control character in string", "\"abc\ndef\""); |
| ExpectErr("Invalid escape sequence", R"("\030")"); |
| ExpectErr("Invalid \\u escape sequence", R"("\usuck")"); |
| ExpectErr("[3:3, byte=19]", R"({ |
| "valid": 1, |
| invalid: 2 |
| })"); |
| ExpectErr("Invalid UTF-8 sequence", "\"\xC0\x80\""); // WTF-8 null |
| } |
| |
| // Direct tests of isUTF8 and fixUTF8. Internal uses are also tested elsewhere. |
| TEST(JSONTest, UTF8) { |
| for (const char *Valid : { |
| "this is ASCII text", |
| "thïs tëxt häs BMP chäräctërs", |
| "𐌶𐌰L𐌾𐍈 C𐍈𐌼𐌴𐍃", |
| }) { |
| EXPECT_TRUE(isUTF8(Valid)) << Valid; |
| EXPECT_EQ(fixUTF8(Valid), Valid); |
| } |
| for (auto Invalid : std::vector<std::pair<const char *, const char *>>{ |
| {"lone trailing \x81\x82 bytes", "lone trailing �� bytes"}, |
| {"missing trailing \xD0 bytes", "missing trailing � bytes"}, |
| {"truncated character \xD0", "truncated character �"}, |
| {"not \xC1\x80 the \xE0\x9f\xBF shortest \xF0\x83\x83\x83 encoding", |
| "not �� the ��� shortest ���� encoding"}, |
| {"too \xF9\x80\x80\x80\x80 long", "too ����� long"}, |
| {"surrogate \xED\xA0\x80 invalid \xF4\x90\x80\x80", |
| "surrogate ��� invalid ����"}}) { |
| EXPECT_FALSE(isUTF8(Invalid.first)) << Invalid.first; |
| EXPECT_EQ(fixUTF8(Invalid.first), Invalid.second); |
| } |
| } |
| |
| TEST(JSONTest, Inspection) { |
| llvm::Expected<Value> Doc = parse(R"( |
| { |
| "null": null, |
| "boolean": false, |
| "number": 2.78, |
| "string": "json", |
| "array": [null, true, 3.14, "hello", [1,2,3], {"time": "arrow"}], |
| "object": {"fruit": "banana"} |
| } |
| )"); |
| EXPECT_TRUE(!!Doc); |
| |
| Object *O = Doc->getAsObject(); |
| ASSERT_TRUE(O); |
| |
| EXPECT_FALSE(O->getNull("missing")); |
| EXPECT_FALSE(O->getNull("boolean")); |
| EXPECT_TRUE(O->getNull("null")); |
| |
| EXPECT_EQ(O->getNumber("number"), llvm::Optional<double>(2.78)); |
| EXPECT_FALSE(O->getInteger("number")); |
| EXPECT_EQ(O->getString("string"), llvm::Optional<llvm::StringRef>("json")); |
| ASSERT_FALSE(O->getObject("missing")); |
| ASSERT_FALSE(O->getObject("array")); |
| ASSERT_TRUE(O->getObject("object")); |
| EXPECT_EQ(*O->getObject("object"), (Object{{"fruit", "banana"}})); |
| |
| Array *A = O->getArray("array"); |
| ASSERT_TRUE(A); |
| EXPECT_EQ((*A)[1].getAsBoolean(), llvm::Optional<bool>(true)); |
| ASSERT_TRUE((*A)[4].getAsArray()); |
| EXPECT_EQ(*(*A)[4].getAsArray(), (Array{1, 2, 3})); |
| EXPECT_EQ((*(*A)[4].getAsArray())[1].getAsInteger(), |
| llvm::Optional<int64_t>(2)); |
| int I = 0; |
| for (Value &E : *A) { |
| if (I++ == 5) { |
| ASSERT_TRUE(E.getAsObject()); |
| EXPECT_EQ(E.getAsObject()->getString("time"), |
| llvm::Optional<llvm::StringRef>("arrow")); |
| } else |
| EXPECT_FALSE(E.getAsObject()); |
| } |
| } |
| |
| // Verify special integer handling - we try to preserve exact int64 values. |
| TEST(JSONTest, Integers) { |
| struct { |
| const char *Desc; |
| Value Val; |
| const char *Str; |
| llvm::Optional<int64_t> AsInt; |
| llvm::Optional<double> AsNumber; |
| } TestCases[] = { |
| { |
| "Non-integer. Stored as double, not convertible.", |
| double{1.5}, |
| "1.5", |
| llvm::None, |
| 1.5, |
| }, |
| |
| { |
| "Integer, not exact double. Stored as int64, convertible.", |
| int64_t{0x4000000000000001}, |
| "4611686018427387905", |
| int64_t{0x4000000000000001}, |
| double{0x4000000000000000}, |
| }, |
| |
| { |
| "Negative integer, not exact double. Stored as int64, convertible.", |
| int64_t{-0x4000000000000001}, |
| "-4611686018427387905", |
| int64_t{-0x4000000000000001}, |
| double{-0x4000000000000000}, |
| }, |
| |
| { |
| "Dynamically exact integer. Stored as double, convertible.", |
| double{0x6000000000000000}, |
| "6.9175290276410819e+18", |
| int64_t{0x6000000000000000}, |
| double{0x6000000000000000}, |
| }, |
| |
| { |
| "Dynamically integer, >64 bits. Stored as double, not convertible.", |
| 1.5 * double{0x8000000000000000}, |
| "1.3835058055282164e+19", |
| llvm::None, |
| 1.5 * double{0x8000000000000000}, |
| }, |
| }; |
| for (const auto &T : TestCases) { |
| EXPECT_EQ(T.Str, s(T.Val)) << T.Desc; |
| llvm::Expected<Value> Doc = parse(T.Str); |
| EXPECT_TRUE(!!Doc) << T.Desc; |
| EXPECT_EQ(Doc->getAsInteger(), T.AsInt) << T.Desc; |
| EXPECT_EQ(Doc->getAsNumber(), T.AsNumber) << T.Desc; |
| EXPECT_EQ(T.Val, *Doc) << T.Desc; |
| EXPECT_EQ(T.Str, s(*Doc)) << T.Desc; |
| } |
| } |
| |
| // Sample struct with typical JSON-mapping rules. |
| struct CustomStruct { |
| CustomStruct() : B(false) {} |
| CustomStruct(std::string S, llvm::Optional<int> I, bool B) |
| : S(S), I(I), B(B) {} |
| std::string S; |
| llvm::Optional<int> I; |
| bool B; |
| }; |
| inline bool operator==(const CustomStruct &L, const CustomStruct &R) { |
| return L.S == R.S && L.I == R.I && L.B == R.B; |
| } |
| inline llvm::raw_ostream &operator<<(llvm::raw_ostream &OS, |
| const CustomStruct &S) { |
| return OS << "(" << S.S << ", " << (S.I ? std::to_string(*S.I) : "None") |
| << ", " << S.B << ")"; |
| } |
| bool fromJSON(const Value &E, CustomStruct &R) { |
| ObjectMapper O(E); |
| if (!O || !O.map("str", R.S) || !O.map("int", R.I)) |
| return false; |
| O.map("bool", R.B); |
| return true; |
| } |
| |
| TEST(JSONTest, Deserialize) { |
| std::map<std::string, std::vector<CustomStruct>> R; |
| CustomStruct ExpectedStruct = {"foo", 42, true}; |
| std::map<std::string, std::vector<CustomStruct>> Expected; |
| Value J = Object{ |
| {"foo", |
| Array{ |
| Object{ |
| {"str", "foo"}, |
| {"int", 42}, |
| {"bool", true}, |
| {"unknown", "ignored"}, |
| }, |
| Object{{"str", "bar"}}, |
| Object{ |
| {"str", "baz"}, {"bool", "string"}, // OK, deserialize ignores. |
| }, |
| }}}; |
| Expected["foo"] = { |
| CustomStruct("foo", 42, true), |
| CustomStruct("bar", llvm::None, false), |
| CustomStruct("baz", llvm::None, false), |
| }; |
| ASSERT_TRUE(fromJSON(J, R)); |
| EXPECT_EQ(R, Expected); |
| |
| CustomStruct V; |
| EXPECT_FALSE(fromJSON(nullptr, V)) << "Not an object " << V; |
| EXPECT_FALSE(fromJSON(Object{}, V)) << "Missing required field " << V; |
| EXPECT_FALSE(fromJSON(Object{{"str", 1}}, V)) << "Wrong type " << V; |
| // Optional<T> must parse as the correct type if present. |
| EXPECT_FALSE(fromJSON(Object{{"str", 1}, {"int", "string"}}, V)) |
| << "Wrong type for Optional<T> " << V; |
| } |
| |
| } // namespace |
| } // namespace json |
| } // namespace llvm |