1 // Copyright 2012 The Chromium Authors
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "base/json/json_reader.h"
6
7 #include <stddef.h>
8
9 #include <cmath>
10 #include <utility>
11
12 #include "base/base_paths.h"
13 #include "base/features.h"
14 #include "base/files/file_util.h"
15 #include "base/logging.h"
16 #include "base/path_service.h"
17 #include "base/rust_buildflags.h"
18 #include "base/strings/string_piece.h"
19 #include "base/strings/stringprintf.h"
20 #include "base/strings/utf_string_conversions.h"
21 #include "base/test/gmock_expected_support.h"
22 #include "base/test/metrics/histogram_tester.h"
23 #include "base/test/scoped_feature_list.h"
24 #include "base/values.h"
25 #include "build/build_config.h"
26 #include "testing/gmock/include/gmock/gmock.h"
27 #include "testing/gtest/include/gtest/gtest.h"
28 #include "third_party/abseil-cpp/absl/types/optional.h"
29
30 namespace {
31
32 // MSan will do a better job detecting over-read errors if the input is not
33 // nul-terminated on the heap. This will copy |input| to a new buffer owned by
34 // |owner|, returning a base::StringPiece to |owner|.
MakeNotNullTerminatedInput(const char * input,std::unique_ptr<char[]> * owner)35 base::StringPiece MakeNotNullTerminatedInput(const char* input,
36 std::unique_ptr<char[]>* owner) {
37 size_t str_len = strlen(input);
38 owner->reset(new char[str_len]);
39 memcpy(owner->get(), input, str_len);
40 return base::StringPiece(owner->get(), str_len);
41 }
42
43 } // namespace
44
45 namespace base {
46
47 class JSONReaderTest : public testing::TestWithParam<bool> {
48 public:
SetUp()49 void SetUp() override {
50 feature_list_.InitWithFeatureState(base::features::kUseRustJsonParser,
51 using_rust_);
52 }
53
54 protected:
55 bool using_rust_ = GetParam();
56 base::test::ScopedFeatureList feature_list_;
57 };
58
// Whitespace surrounding a value does not prevent it from being parsed.
TEST_P(JSONReaderTest, Whitespace) {
  const absl::optional<Value> parsed = JSONReader::Read(" null ");
  ASSERT_TRUE(parsed.has_value());
  EXPECT_TRUE(parsed->is_none());
}
64
// Inputs that do not form a JSON value at all must be rejected; see
// https://tools.ietf.org/rfc/rfc8259.txt
TEST_P(JSONReaderTest, InvalidString) {
  const char* const kNotJsonValues[] = {"", "nu"};
  for (const char* input : kNotJsonValues) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
71
TEST_P(JSONReaderTest,SimpleBool)72 TEST_P(JSONReaderTest, SimpleBool) {
73 #if BUILDFLAG(BUILD_RUST_JSON_READER)
74 base::HistogramTester histograms;
75 #endif // BUILDFLAG(BUILD_RUST_JSON_READER)
76 absl::optional<Value> root = JSONReader::Read("true ");
77 ASSERT_TRUE(root);
78 EXPECT_TRUE(root->is_bool());
79 #if BUILDFLAG(BUILD_RUST_JSON_READER)
80 histograms.ExpectTotalCount("Security.JSONParser.ParsingTime", 1);
81 #endif // BUILDFLAG(BUILD_RUST_JSON_READER)
82 }
83
// Checks that /* block */ and // line comments are skipped before, after and
// inside values, and that a lone '/' that does not start a comment is
// rejected.
TEST_P(JSONReaderTest, EmbeddedComments) {
  absl::optional<Value> root = JSONReader::Read("/* comment */null");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_none());
  root = JSONReader::Read("40 /* comment */");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_int());
  root = JSONReader::Read("true // comment");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_bool());

  // Comments in different contexts.
  root = JSONReader::Read("{ \"cheese\": 3\n\n // Here's a comment\n}");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_dict());
  root = JSONReader::Read("{ \"cheese\": 3// Here's a comment\n}");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_dict());

  // Multiple comment markers.
  root = JSONReader::Read(
      "{ \"cheese\": 3// Here's a comment // and another\n}");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_dict());
  root = JSONReader::Read("/* comment */\"sample string\"");
  ASSERT_TRUE(root);
  ASSERT_TRUE(root->is_string());
  EXPECT_EQ("sample string", root->GetString());

  // A block comment may hide list elements and the closing bracket.
  root = JSONReader::Read("[1, /* comment, 2 ] */ \n 3]");
  ASSERT_TRUE(root);
  Value::List* list = root->GetIfList();
  ASSERT_TRUE(list);
  ASSERT_EQ(2u, list->size());
  ASSERT_TRUE((*list)[0].is_int());
  EXPECT_EQ(1, (*list)[0].GetInt());
  ASSERT_TRUE((*list)[1].is_int());
  EXPECT_EQ(3, (*list)[1].GetInt());
  root = JSONReader::Read("[1, /*a*/2, 3]");
  ASSERT_TRUE(root);
  list = root->GetIfList();
  ASSERT_TRUE(list);
  EXPECT_EQ(3u, (*list).size());

  // A block comment terminated by "**/".
  root = JSONReader::Read("/* comment **/42");
  ASSERT_TRUE(root);
  ASSERT_TRUE(root->is_int());
  EXPECT_EQ(42, root->GetInt());
  root = JSONReader::Read(
      "/* comment **/\n"
      "// */ 43\n"
      "44");
  ASSERT_TRUE(root);
  // ASSERT rather than EXPECT, matching the checks above: GetInt() below is
  // only meaningful once the value is known to be an int.
  ASSERT_TRUE(root->is_int());
  EXPECT_EQ(44, root->GetInt());

  // At one point, this parsed successfully as the value three.
  EXPECT_FALSE(JSONReader::Read("/33"));
}
139
// A plain decimal integer parses to an int value.
TEST_P(JSONReaderTest, Ints) {
  const absl::optional<Value> parsed = JSONReader::Read("43");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_int());
  EXPECT_EQ(43, parsed->GetInt());
}
146
// RFC 8259 does not permit octal, hexadecimal, or leading-zero numbers.
TEST_P(JSONReaderTest, NonDecimalNumbers) {
  const char* const kRejected[] = {"043", "0x43", "00"};
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
153
// A lone "0" is valid even though numbers with a leading zero are otherwise
// rejected, so it is covered on its own.
TEST_P(JSONReaderTest, NumberZero) {
  const absl::optional<Value> parsed = JSONReader::Read("0");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_int());
  EXPECT_EQ(0, parsed->GetInt());
}
162
// Integers just outside the 32-bit int range still parse; they are expected
// to come back stored as doubles.
TEST_P(JSONReaderTest, LargeIntPromotion) {
  struct PromotionCase {
    const char* json;
    double expected;
  };
  const PromotionCase kCases[] = {
      {"2147483648", 2147483648.0},
      {"-2147483649", -2147483649.0},
  };
  for (const PromotionCase& test_case : kCases) {
    const absl::optional<Value> parsed = JSONReader::Read(test_case.json);
    ASSERT_TRUE(parsed.has_value());
    EXPECT_TRUE(parsed->is_double());
    EXPECT_DOUBLE_EQ(test_case.expected, parsed->GetDouble());
  }
}
175
// Parses 9223372036854775807 (2^63 - 1) as a JSON number, not a JSON string.
// The resulting base::Value holds either a 32-bit int or a 64-bit double; this
// input overflows the former and can only be approximated by the latter, so
// the parse is expected to be lossy.
TEST_P(JSONReaderTest, LargerIntIsLossy) {
  const char* const kInput = "9223372036854775807";
  const char* const kRoundedOutput = "9223372036854775808.000000";

  const absl::optional<Value> parsed = JSONReader::Read(kInput);
  ASSERT_TRUE(parsed.has_value());
  ASSERT_FALSE(parsed->is_int());
  ASSERT_TRUE(parsed->is_double());

  // StringPrintf is used rather than NumberToString because NumberToString
  // offers no way to choose the precision, and its default rendering,
  // "9.223372036854776e+18", is too coarse to reveal the lossiness.
  const std::string printed = StringPrintf("%f", parsed->GetDouble());
  EXPECT_EQ(std::string(kRoundedOutput), printed);
}
192
// Exercises fractional and exponent notations that must parse as doubles, plus
// one value that is well-formed but too large to represent.
TEST_P(JSONReaderTest, Doubles) {
  struct DoubleCase {
    const char* json;
    double expected;
  };
  const DoubleCase kCases[] = {
      {"43.1", 43.1},
      {"4.3e-1", .43},
      {"2.1e0", 2.1},
      {"2.1e+0001", 21.0},
      {"0.01", 0.01},
      {"1.00", 1.0},
      // Some "parse to float64" implementations find this one tricky.
      // https://github.com/serde-rs/json/issues/707
      {"122.416294033786585", 122.416294033786585},
  };
  for (const DoubleCase& test_case : kCases) {
    const absl::optional<Value> parsed = JSONReader::Read(test_case.json);
    ASSERT_TRUE(parsed.has_value());
    EXPECT_TRUE(parsed->is_double());
    EXPECT_DOUBLE_EQ(test_case.expected, parsed->GetDouble());
  }

  // Syntactically valid, but out of range of a double.
  const auto out_of_range =
      JSONReader::ReadAndReturnValueWithError("1e1000", JSON_PARSE_RFC);
  ASSERT_FALSE(out_of_range.has_value());
}
236
// A decimal point must have at least one digit on each side of it.
TEST_P(JSONReaderTest, FractionalNumbers) {
  const char* const kRejected[] = {"1.", ".1", "1.e10"};
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
243
// The exponent marker must be followed by digits, and only digits.
TEST_P(JSONReaderTest, ExponentialNumbers) {
  const char* const kRejected[] = {"1e", "1E", "1e1.", "1e1.0"};
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
251
// Neither overflowing literals nor spelled-out NaN/infinity are accepted.
TEST_P(JSONReaderTest, InvalidInfNAN) {
  const char* const kRejected[] = {
      // The largest finite double is roughly 1.8e308.
      "1e1000",
      "-1e1000",
      "NaN",
      "nan",
      "inf",
  };
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
260
// One well-formed number as a baseline, followed by malformed variants that
// must all be rejected.
TEST_P(JSONReaderTest, InvalidNumbers) {
  EXPECT_TRUE(JSONReader::Read("4.3").has_value());

  const char* const kRejected[] = {"4.", "4.3.1", "4e3.1", "4.a", "42a"};
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
269
// Covers the spellings of zero: "0" is an int, while "0.0", "-0" and "-0.0"
// are doubles whose sign bit must reflect the sign written in the input.
TEST_P(JSONReaderTest, Zeroes) {
  absl::optional<Value> root = JSONReader::Read("0");
  ASSERT_TRUE(root);
  // Assert the type before calling GetInt(), and compare the int exactly
  // instead of through a floating-point comparison.
  ASSERT_TRUE(root->is_int());
  EXPECT_EQ(0, root->GetInt());

  root = JSONReader::Read("0.0");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_double());
  EXPECT_DOUBLE_EQ(0.0, root->GetDouble());
  EXPECT_FALSE(std::signbit(root->GetDouble()));

  // "-0" has no fractional part but is still expected to be a double, so that
  // the negative sign is preserved.
  root = JSONReader::Read("-0");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_double());
  EXPECT_DOUBLE_EQ(0.0, root->GetDouble());
  EXPECT_TRUE(std::signbit(root->GetDouble()));

  root = JSONReader::Read("-0.0");
  ASSERT_TRUE(root);
  EXPECT_TRUE(root->is_double());
  EXPECT_DOUBLE_EQ(-0.0, root->GetDouble());
  EXPECT_TRUE(std::signbit(root->GetDouble()));
}
294
// A quoted string parses to a string value with the quotes removed.
TEST_P(JSONReaderTest, SimpleString) {
  const absl::optional<Value> parsed = JSONReader::Read("\"hello world\"");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_string());
  EXPECT_EQ("hello world", parsed->GetString());
}
301
// An empty pair of quotes parses to an empty string value.
TEST_P(JSONReaderTest, EmptyString) {
  const absl::optional<Value> parsed = JSONReader::Read("\"\"");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_string());
  EXPECT_EQ("", parsed->GetString());
}
308
// Each single-character backslash escape decodes to the character it names.
TEST_P(JSONReaderTest, BasicStringEscapes) {
  const char* const kEscapedJson = "\" \\\"\\\\\\/\\b\\f\\n\\r\\t\\v\"";
  const absl::optional<Value> parsed = JSONReader::Read(kEscapedJson);
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_string());
  EXPECT_EQ(" \"\\/\b\f\n\r\t\v", parsed->GetString());
}
316
// Covers \x and \u escapes, including ones that decode to the null character.
TEST_P(JSONReaderTest, UnicodeEscapes) {
  const absl::optional<Value> parsed =
      JSONReader::Read("\"\\x41\\xFF\\x00\\u1234\\u0000\"");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_string());
  // The explicit length keeps the embedded and trailing nulls in the
  // expected value.
  const std::wstring expected(L"A\x00FF\0\x1234\0", 5);
  EXPECT_EQ(expected, UTF8ToWide(parsed->GetString()));

  // A \u escape must consist of exactly four hex characters. Previously the
  // parser accepted things like "0x01" and "0X01".
  EXPECT_FALSE(JSONReader::Read("\"\\u0x12\"").has_value());

  // Surrogate pairs are allowed in JSON.
  EXPECT_TRUE(JSONReader::Read("\"\\uD834\\uDD1E\"").has_value());  // U+1D11E
}
333
// Malformed string literals must be rejected. Apart from the deliberately
// unterminated first case, every input is a fully quoted string, so the only
// thing wrong with it is the defect its text describes.
TEST_P(JSONReaderTest, InvalidStrings) {
  EXPECT_FALSE(JSONReader::Read("\"no closing quote"));
  EXPECT_FALSE(JSONReader::Read("\"\\z invalid escape char\""));
  EXPECT_FALSE(JSONReader::Read("\"\\xAQ invalid hex code\""));
  // The opening quote matters here: without it the input is rejected as a
  // bare token and the truncated \x escape is never reached.
  EXPECT_FALSE(JSONReader::Read("\"not enough hex chars\\x1\""));
  EXPECT_FALSE(JSONReader::Read("\"not enough escape chars\\u123\""));
  EXPECT_FALSE(JSONReader::Read("\"extra backslash at end of input\\\""));
}
342
// A flat array parses to a list, and the same array with a trailing comma
// parses to an equal value when trailing commas are allowed.
TEST_P(JSONReaderTest, BasicArray) {
  const absl::optional<Value> strict = JSONReader::Read("[true, false, null]");
  ASSERT_TRUE(strict.has_value());
  const Value::List* strict_list = strict->GetIfList();
  ASSERT_TRUE(strict_list);
  EXPECT_EQ(3U, strict_list->size());

  // Test with trailing comma. Should be parsed the same as above.
  const absl::optional<Value> lenient =
      JSONReader::Read("[true, false, null, ]", JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(lenient.has_value());
  EXPECT_EQ(*strict_list, *lenient);
}
356
// "[]" parses to a list with no elements.
TEST_P(JSONReaderTest, EmptyArray) {
  const absl::optional<Value> parsed = JSONReader::Read("[]");
  ASSERT_TRUE(parsed.has_value());
  const Value::List* elements = parsed->GetIfList();
  ASSERT_TRUE(elements);
  EXPECT_TRUE(elements->empty());
}
364
// An array mixing string, int, double and null elements keeps all four.
TEST_P(JSONReaderTest, CompleteArray) {
  const absl::optional<Value> parsed =
      JSONReader::Read("[\"a\", 3, 4.56, null]");
  ASSERT_TRUE(parsed.has_value());
  const Value::List* elements = parsed->GetIfList();
  ASSERT_TRUE(elements);
  EXPECT_EQ(4U, elements->size());
}
372
// Arrays nested inside arrays (with a dictionary in between) parse, and
// adding trailing commas at several depths yields an equal value when
// trailing commas are allowed.
TEST_P(JSONReaderTest, NestedArrays) {
  const absl::optional<Value> strict = JSONReader::Read(
      "[[true], [], {\"smell\": \"nice\",\"taste\": \"yummy\" }, [false, [], "
      "[null]], null]");
  ASSERT_TRUE(strict.has_value());
  const Value::List* strict_list = strict->GetIfList();
  ASSERT_TRUE(strict_list);
  EXPECT_EQ(5U, strict_list->size());

  // Lots of trailing commas.
  const absl::optional<Value> lenient = JSONReader::Read(
      "[[true], [], {\"smell\": \"nice\",\"taste\": \"yummy\" }, [false, [], "
      "[null, ] , ], null,]",
      JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(lenient.has_value());
  EXPECT_EQ(*strict_list, *lenient);
}
390
// Structurally broken arrays must be rejected.
TEST_P(JSONReaderTest, InvalidArrays) {
  // Missing close brace.
  const char* const kUnterminated = "[[true], [], [false, [], [null]], null";
  EXPECT_FALSE(JSONReader::Read(kUnterminated).has_value());

  // Too many commas, with and without trailing commas being allowed.
  const char* const kDoubleComma = "[true,, null]";
  EXPECT_FALSE(JSONReader::Read(kDoubleComma).has_value());
  EXPECT_FALSE(
      JSONReader::Read(kDoubleComma, JSON_ALLOW_TRAILING_COMMAS).has_value());

  // No commas.
  EXPECT_FALSE(JSONReader::Read("[true null]").has_value());

  // Trailing comma.
  EXPECT_FALSE(JSONReader::Read("[true,]").has_value());
}
405
// With JSON_ALLOW_TRAILING_COMMAS, "[true,]" is a one-element list.
TEST_P(JSONReaderTest, ArrayTrailingComma) {
  const absl::optional<Value> parsed =
      JSONReader::Read("[true,]", JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(parsed.has_value());
  const Value::List* elements = parsed->GetIfList();
  ASSERT_TRUE(elements);
  ASSERT_EQ(1U, elements->size());
  const Value& only_element = (*elements)[0];
  ASSERT_TRUE(only_element.is_bool());
  EXPECT_TRUE(only_element.GetBool());
}
418
// Allowing trailing commas must not make empty elements acceptable.
TEST_P(JSONReaderTest, ArrayTrailingCommaNoEmptyElements) {
  const char* const kRejected[] = {
      "[,]",
      "[true,,]",
      "[,true,]",
      "[true,,false]",
  };
  for (const char* input : kRejected) {
    EXPECT_FALSE(
        JSONReader::Read(input, JSON_ALLOW_TRAILING_COMMAS).has_value());
  }
}
427
// "{}" parses to a dictionary value.
TEST_P(JSONReaderTest, EmptyDictionary) {
  const absl::optional<Value> parsed = JSONReader::Read("{}");
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_dict());
}
433
// Parses a dictionary holding one value of each kind and checks every entry,
// then checks that three reformatted variants (trailing commas, LF line
// endings, CRLF line endings) parse to an equal dictionary.
TEST_P(JSONReaderTest, CompleteDictionary) {
  absl::optional<Value> root1 = JSONReader::Read(
      "{\"number\":9.87654321, \"null\":null , \"\\x53\" : \"str\", \"bool\": "
      "false, \"more\": {} }");
  ASSERT_TRUE(root1);
  const Value::Dict* root1_dict = root1->GetIfDict();
  ASSERT_TRUE(root1_dict);
  auto double_val = root1_dict->FindDouble("number");
  ASSERT_TRUE(double_val);
  EXPECT_DOUBLE_EQ(9.87654321, *double_val);
  const Value* null_val = root1_dict->Find("null");
  ASSERT_TRUE(null_val);
  EXPECT_TRUE(null_val->is_none());
  // The key is written as the escape \x53 in the input, i.e. "S".
  const std::string* str_val = root1_dict->FindString("S");
  ASSERT_TRUE(str_val);
  EXPECT_EQ("str", *str_val);
  auto bool_val = root1_dict->FindBool("bool");
  ASSERT_TRUE(bool_val);
  ASSERT_FALSE(*bool_val);

  absl::optional<Value> root2 = JSONReader::Read(
      "{\"number\":9.87654321, \"null\":null , \"\\x53\" : \"str\", \"bool\": "
      "false, \"more\": {},}",
      JSON_PARSE_CHROMIUM_EXTENSIONS | JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(root2);
  Value::Dict* root2_dict = root2->GetIfDict();
  ASSERT_TRUE(root2_dict);
  EXPECT_EQ(*root1_dict, *root2_dict);

  // Test newline equivalence.
  root2 = JSONReader::Read(
      "{\n"
      " \"number\":9.87654321,\n"
      " \"null\":null,\n"
      " \"\\x53\":\"str\",\n"
      " \"bool\": false,\n"
      " \"more\": {},\n"
      "}\n",
      JSON_PARSE_CHROMIUM_EXTENSIONS | JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(root2);
  root2_dict = root2->GetIfDict();
  // Check the pointer that is dereferenced below, not the optional again.
  ASSERT_TRUE(root2_dict);
  EXPECT_EQ(*root1_dict, *root2_dict);

  root2 = JSONReader::Read(
      "{\r\n"
      " \"number\":9.87654321,\r\n"
      " \"null\":null,\r\n"
      " \"\\x53\":\"str\",\r\n"
      " \"bool\": false,\r\n"
      " \"more\": {},\r\n"
      "}\r\n",
      JSON_PARSE_CHROMIUM_EXTENSIONS | JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(root2);
  root2_dict = root2->GetIfDict();
  ASSERT_TRUE(root2_dict);
  EXPECT_EQ(*root1_dict, *root2_dict);
}
492
// Dictionaries nested inside dictionaries are reachable through the typed
// Find* accessors, and a variant with trailing commas parses to an equal
// value when trailing commas are allowed.
TEST_P(JSONReaderTest, NestedDictionaries) {
  const absl::optional<Value> strict = JSONReader::Read(
      "{\"inner\":{\"array\":[true, 3, 4.56, null]},\"false\":false,\"d\":{}}");
  ASSERT_TRUE(strict.has_value());
  const Value::Dict* strict_dict = strict->GetIfDict();
  ASSERT_TRUE(strict_dict);

  const Value::Dict* inner = strict_dict->FindDict("inner");
  ASSERT_TRUE(inner);
  const Value::List* array = inner->FindList("array");
  ASSERT_TRUE(array);
  EXPECT_EQ(4U, array->size());

  const auto false_entry = strict_dict->FindBool("false");
  ASSERT_TRUE(false_entry);
  EXPECT_FALSE(*false_entry);

  const Value::Dict* empty_entry = strict_dict->FindDict("d");
  EXPECT_TRUE(empty_entry);

  const absl::optional<Value> lenient = JSONReader::Read(
      "{\"inner\": {\"array\":[true, 3, 4.56, null] , "
      "},\"false\":false,\"d\":{},}",
      JSON_ALLOW_TRAILING_COMMAS);
  ASSERT_TRUE(lenient.has_value());
  EXPECT_EQ(*strict_dict, *lenient);
}
517
// Keys containing '.' are ordinary keys for the plain Find* accessors; only
// FindByDottedPath treats the dots as path separators.
TEST_P(JSONReaderTest, DictionaryKeysWithPeriods) {
  {
    const absl::optional<Value> parsed =
        JSONReader::Read("{\"a.b\":3,\"c\":2,\"d.e.f\":{\"g.h.i.j\":1}}");
    ASSERT_TRUE(parsed.has_value());
    const Value::Dict* top = parsed->GetIfDict();
    ASSERT_TRUE(top);

    const auto a_b = top->FindInt("a.b");
    ASSERT_TRUE(a_b);
    EXPECT_EQ(3, *a_b);
    const auto c = top->FindInt("c");
    ASSERT_TRUE(c);
    EXPECT_EQ(2, *c);
    const Value::Dict* nested = top->FindDict("d.e.f");
    ASSERT_TRUE(nested);
    EXPECT_EQ(1U, nested->size());
    const auto g_h_i_j = nested->FindInt("g.h.i.j");
    ASSERT_TRUE(g_h_i_j);
    EXPECT_EQ(1, *g_h_i_j);
  }

  {
    // The same text "a.b" names a nested entry when used as a dotted path and
    // a top-level entry when used as a literal key.
    const absl::optional<Value> parsed =
        JSONReader::Read("{\"a\":{\"b\":2},\"a.b\":1}");
    ASSERT_TRUE(parsed.has_value());
    const Value::Dict* top = parsed->GetIfDict();
    ASSERT_TRUE(top);
    const Value* via_path = top->FindByDottedPath("a.b");
    ASSERT_TRUE(via_path);
    EXPECT_EQ(2, via_path->GetInt());
    const auto via_key = top->FindInt("a.b");
    ASSERT_TRUE(via_key);
    EXPECT_EQ(1, *via_key);
  }
}
549
// When a key is repeated, the value from its last occurrence is the one kept.
TEST_P(JSONReaderTest, DuplicateKeys) {
  const absl::optional<Value> parsed =
      JSONReader::Read("{\"x\":1,\"x\":2,\"y\":3}");
  ASSERT_TRUE(parsed.has_value());
  const Value::Dict* entries = parsed->GetIfDict();
  ASSERT_TRUE(entries);

  const auto x = entries->FindInt("x");
  ASSERT_TRUE(x);
  EXPECT_EQ(2, *x);
}
560
// Structurally broken dictionaries must be rejected, both with the default
// options and when trailing commas are allowed.
TEST_P(JSONReaderTest, InvalidDictionaries) {
  const char* const kRejectedByDefault[] = {
      // No closing brace.
      "{\"a\": true",
      // Keys must be quoted strings.
      "{foo:true}",
      "{1234: false}",
      "{:false}",
      "{ , }",
      // Trailing comma.
      "{\"a\":true,}",
      // Too many commas.
      "{\"a\":true,,\"b\":false}",
      // No separator.
      "{\"a\" \"b\"}",
      // Lone comma.
      "{,}",
  };
  for (const char* input : kRejectedByDefault) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }

  // Allowing trailing commas does not make stray or doubled commas valid. The
  // doubled-comma input is listed twice to keep the same set of calls.
  const char* const kRejectedWithTrailingCommas[] = {
      "{\"a\":true,,\"b\":false}",
      "{,}",
      "{\"a\":true,,}",
      "{,\"a\":true}",
      "{\"a\":true,,\"b\":false}",
  };
  for (const char* input : kRejectedWithTrailingCommas) {
    EXPECT_FALSE(
        JSONReader::Read(input, JSON_ALLOW_TRAILING_COMMAS).has_value());
  }
}
590
// One million nested lists must be rejected, while a few thousand sibling
// lists inside a single list must parse.
TEST_P(JSONReaderTest, StackOverflow) {
  const size_t kNestingDepth = 1000000;
  std::string deeply_nested(kNestingDepth, '[');
  deeply_nested.append(kNestingDepth, ']');
  EXPECT_FALSE(JSONReader::Read(deeply_nested).has_value());

  // A few thousand adjacent lists is fine.
  std::string wide = "[";
  wide.reserve(15010);
  for (int remaining = 5000; remaining > 0; --remaining) {
    wide += "[],";
  }
  wide += "[]]";
  const absl::optional<Value> parsed = JSONReader::Read(wide);
  ASSERT_TRUE(parsed.has_value());
  const Value::List* elements = parsed->GetIfList();
  ASSERT_TRUE(elements);
  EXPECT_EQ(5001U, elements->size());
}
608
// Raw (unescaped) UTF-8 inside string literals is passed through unchanged,
// including the code points Unicode designates as noncharacters.
TEST_P(JSONReaderTest, UTF8Input) {
  {
    const absl::optional<Value> parsed =
        JSONReader::Read("\"\xe7\xbd\x91\xe9\xa1\xb5\"");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    EXPECT_EQ(L"\x7f51\x9875", UTF8ToWide(parsed->GetString()));
  }

  {
    const absl::optional<Value> parsed = JSONReader::Read(
        "{\"path\": \"/tmp/\xc3\xa0\xc3\xa8\xc3\xb2.png\"}");
    ASSERT_TRUE(parsed.has_value());
    const Value::Dict* entries = parsed->GetIfDict();
    ASSERT_TRUE(entries);
    const std::string* path = entries->FindString("path");
    ASSERT_TRUE(path);
    EXPECT_EQ("/tmp/\xC3\xA0\xC3\xA8\xC3\xB2.png", *path);
  }

  // JSON can encode non-characters.
  const char* const kNoncharacters[] = {
      "\"\xEF\xB7\x90\"",      // U+FDD0
      "\"\xEF\xB7\x9F\"",      // U+FDDF
      "\"\xEF\xB7\xAF\"",      // U+FDEF
      "\"\xEF\xBF\xBE\"",      // U+FFFE
      "\"\xEF\xBF\xBF\"",      // U+FFFF
      "\"\xF0\x9F\xBF\xBE\"",  // U+01FFFE
      "\"\xF0\x9F\xBF\xBF\"",  // U+01FFFF
      "\"\xF0\xAF\xBF\xBE\"",  // U+02FFFE
      "\"\xF0\xAF\xBF\xBF\"",  // U+02FFFF
      "\"\xF0\xBF\xBF\xBE\"",  // U+03FFFE
      "\"\xF0\xBF\xBF\xBF\"",  // U+03FFFF
      "\"\xF1\x8F\xBF\xBE\"",  // U+04FFFE
      "\"\xF1\x8F\xBF\xBF\"",  // U+04FFFF
      "\"\xF1\x9F\xBF\xBE\"",  // U+05FFFE
      "\"\xF1\x9F\xBF\xBF\"",  // U+05FFFF
      "\"\xF1\xAF\xBF\xBE\"",  // U+06FFFE
      "\"\xF1\xAF\xBF\xBF\"",  // U+06FFFF
      "\"\xF1\xBF\xBF\xBE\"",  // U+07FFFE
      "\"\xF1\xBF\xBF\xBF\"",  // U+07FFFF
      "\"\xF2\x8F\xBF\xBE\"",  // U+08FFFE
      "\"\xF2\x8F\xBF\xBF\"",  // U+08FFFF
      "\"\xF2\x9F\xBF\xBE\"",  // U+09FFFE
      "\"\xF2\x9F\xBF\xBF\"",  // U+09FFFF
      "\"\xF2\xAF\xBF\xBE\"",  // U+0AFFFE
      "\"\xF2\xAF\xBF\xBF\"",  // U+0AFFFF
      "\"\xF2\xBF\xBF\xBE\"",  // U+0BFFFE
      "\"\xF2\xBF\xBF\xBF\"",  // U+0BFFFF
      "\"\xF3\x8F\xBF\xBE\"",  // U+0CFFFE
      "\"\xF3\x8F\xBF\xBF\"",  // U+0CFFFF
      "\"\xF3\x9F\xBF\xBE\"",  // U+0DFFFE
      "\"\xF3\x9F\xBF\xBF\"",  // U+0DFFFF
      "\"\xF3\xAF\xBF\xBE\"",  // U+0EFFFE
      "\"\xF3\xAF\xBF\xBF\"",  // U+0EFFFF
      "\"\xF3\xBF\xBF\xBE\"",  // U+0FFFFE
      "\"\xF3\xBF\xBF\xBF\"",  // U+0FFFFF
      "\"\xF4\x8F\xBF\xBE\"",  // U+10FFFE
      "\"\xF4\x8F\xBF\xBF\"",  // U+10FFFF
  };
  for (const char* quoted : kNoncharacters) {
    const absl::optional<Value> parsed = JSONReader::Read(quoted);
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    // The expected payload is the literal with its two quotes stripped.
    const std::string literal(quoted);
    EXPECT_EQ(literal.substr(1, literal.size() - 2), parsed->GetString());
  }
}
672
// Strings containing byte sequences that are not valid UTF-8 are rejected.
TEST_P(JSONReaderTest, InvalidUTF8Input) {
  const char* const kRejected[] = {
      "\"345\xb0\xa1\xb0\xa2\"",
      "\"123\xc0\x81\"",
      "\"abc\xc0\xae\"",
  };
  for (const char* input : kRejected) {
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
678
// \u escapes, including surrogate pairs, decode to the matching UTF-8 bytes.
TEST_P(JSONReaderTest, UTF16Escapes) {
  {
    // A single BMP code point followed by plain text.
    const absl::optional<Value> parsed = JSONReader::Read("\"\\u20ac3,14\"");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    EXPECT_EQ(
        "\xe2\x82\xac"
        "3,14",
        parsed->GetString());
  }

  {
    // Two consecutive surrogate pairs.
    const absl::optional<Value> parsed =
        JSONReader::Read("\"\\ud83d\\udca9\\ud83d\\udc6c\"");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    EXPECT_EQ("\xf0\x9f\x92\xa9\xf0\x9f\x91\xac", parsed->GetString());
  }
}
693
// Truncated, non-hex, or badly paired \u escapes are rejected. The offending
// input is streamed into the failure message to identify the failing case.
TEST_P(JSONReaderTest, InvalidUTF16Escapes) {
  const char* const kRejected[] = {
      "\"\\u123\"",          // Invalid scalar.
      "\"\\ud83d\"",         // Invalid scalar.
      "\"\\u$%@!\"",         // Invalid scalar.
      "\"\\uzz89\"",         // Invalid scalar.
      "\"\\ud83d\\udca\"",   // Invalid lower surrogate.
      "\"\\ud83d\\ud83d\"",  // Invalid lower surrogate.
      "\"\\ud83d\\uaaaZ\"",  // Invalid lower surrogate.
      "\"\\ud83foo\"",       // No lower surrogate.
      "\"\\ud83d\\foo\"",    // No lower surrogate.
      "\"\\ud83\\foo\"",     // Invalid upper surrogate.
      "\"\\ud83d\\u1\"",     // No lower surrogate.
      "\"\\ud83\\u1\"",      // Invalid upper surrogate.
  };
  for (const char* input : kRejected) {
    const absl::optional<Value> parsed = JSONReader::Read(input);
    EXPECT_FALSE(parsed) << input;
  }
}
715
// The document root may be a bare literal rather than a list or dictionary.
TEST_P(JSONReaderTest, LiteralRoots) {
  {
    const absl::optional<Value> parsed = JSONReader::Read("null");
    ASSERT_TRUE(parsed.has_value());
    EXPECT_TRUE(parsed->is_none());
  }
  {
    const absl::optional<Value> parsed = JSONReader::Read("true");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_bool());
    EXPECT_TRUE(parsed->GetBool());
  }
  {
    const absl::optional<Value> parsed = JSONReader::Read("10");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_int());
    EXPECT_EQ(10, parsed->GetInt());
  }
  {
    const absl::optional<Value> parsed = JSONReader::Read("\"root\"");
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    EXPECT_EQ("root", parsed->GetString());
  }
}
736
// Loads json/bom_feff.json from the test data directory and checks that its
// contents parse to a dictionary. Judging by its name the file begins with a
// U+FEFF byte order mark -- confirm against the test data.
TEST_P(JSONReaderTest, ReadFromFile) {
  FilePath json_dir;
  ASSERT_TRUE(PathService::Get(base::DIR_TEST_DATA, &json_dir));
  json_dir = json_dir.AppendASCII("json");
  ASSERT_TRUE(base::PathExists(json_dir));

  const FilePath json_file = json_dir.AppendASCII("bom_feff.json");
  std::string contents;
  ASSERT_TRUE(ReadFileToString(json_file, &contents));

  EXPECT_THAT(
      JSONReader::ReadAndReturnValueWithError(contents),
      base::test::ValueIs(::testing::Property(&base::Value::is_dict, true)));
}
750
751 // Tests that the root of a JSON object can be deleted safely while its
752 // children outlive it.
TEST_P(JSONReaderTest,StringOptimizations)753 TEST_P(JSONReaderTest, StringOptimizations) {
754 Value dict_literal_0;
755 Value dict_literal_1;
756 Value dict_string_0;
757 Value dict_string_1;
758 Value list_value_0;
759 Value list_value_1;
760
761 {
762 absl::optional<Value> root = JSONReader::Read(
763 "{"
764 " \"test\": {"
765 " \"foo\": true,"
766 " \"bar\": 3.14,"
767 " \"baz\": \"bat\","
768 " \"moo\": \"cow\""
769 " },"
770 " \"list\": ["
771 " \"a\","
772 " \"b\""
773 " ]"
774 "}",
775 JSON_PARSE_RFC);
776 ASSERT_TRUE(root);
777 Value::Dict* root_dict = root->GetIfDict();
778 ASSERT_TRUE(root_dict);
779
780 Value::Dict* dict = root_dict->FindDict("test");
781 ASSERT_TRUE(dict);
782 Value::List* list = root_dict->FindList("list");
783 ASSERT_TRUE(list);
784
785 Value* to_move = dict->Find("foo");
786 ASSERT_TRUE(to_move);
787 dict_literal_0 = std::move(*to_move);
788 to_move = dict->Find("bar");
789 ASSERT_TRUE(to_move);
790 dict_literal_1 = std::move(*to_move);
791 to_move = dict->Find("baz");
792 ASSERT_TRUE(to_move);
793 dict_string_0 = std::move(*to_move);
794 to_move = dict->Find("moo");
795 ASSERT_TRUE(to_move);
796 dict_string_1 = std::move(*to_move);
797 ASSERT_TRUE(dict->Remove("foo"));
798 ASSERT_TRUE(dict->Remove("bar"));
799 ASSERT_TRUE(dict->Remove("baz"));
800 ASSERT_TRUE(dict->Remove("moo"));
801
802 ASSERT_EQ(2u, list->size());
803 list_value_0 = std::move((*list)[0]);
804 list_value_1 = std::move((*list)[1]);
805 list->clear();
806 }
807
808 ASSERT_TRUE(dict_literal_0.is_bool());
809 EXPECT_TRUE(dict_literal_0.GetBool());
810
811 ASSERT_TRUE(dict_literal_1.is_double());
812 EXPECT_EQ(3.14, dict_literal_1.GetDouble());
813
814 ASSERT_TRUE(dict_string_0.is_string());
815 EXPECT_EQ("bat", dict_string_0.GetString());
816
817 ASSERT_TRUE(dict_string_1.is_string());
818 EXPECT_EQ("cow", dict_string_1.GetString());
819
820 ASSERT_TRUE(list_value_0.is_string());
821 EXPECT_EQ("a", list_value_0.GetString());
822 ASSERT_TRUE(list_value_1.is_string());
823 EXPECT_EQ("b", list_value_1.GetString());
824 }
825
826 // A smattering of invalid JSON designed to test specific portions of the
827 // parser implementation against buffer overflow. Best run with DCHECKs so
828 // that the one in NextChar fires.
TEST_P(JSONReaderTest,InvalidSanity)829 TEST_P(JSONReaderTest, InvalidSanity) {
830 const char* const kInvalidJson[] = {
831 "/* test *", "{\"foo\"", "{\"foo\":", " [", "\"\\u123g\"", "{\n\"eh:\n}",
832 };
833
834 for (size_t i = 0; i < std::size(kInvalidJson); ++i) {
835 LOG(INFO) << "Sanity test " << i << ": <" << kInvalidJson[i] << ">";
836 auto root = JSONReader::ReadAndReturnValueWithError(kInvalidJson[i]);
837 EXPECT_FALSE(root.has_value());
838 EXPECT_NE("", root.error().message);
839 }
840 }
841
// A NUL byte following an otherwise complete JSON value is part of the input
// (the std::string is built with an explicit length that includes it) and
// must cause the parse to fail with a non-empty error message.
TEST_P(JSONReaderTest, IllegalTrailingNull) {
  const char json[] = {'"', 'n', 'u', 'l', 'l', '"', '\0'};
  std::string json_string(json, sizeof(json));
  auto root = JSONReader::ReadAndReturnValueWithError(json_string);
  // Fatal assertion: error() must not be read from a result that holds a
  // value.
  ASSERT_FALSE(root.has_value());
  EXPECT_NE("", root.error().message);
}
849
// RFC 8259 section 7 lists the control characters (U+0000 through U+001F)
// among "the characters that MUST be escaped", so a literal NUL byte or a
// literal newline inside a JSON string ought to be rejected.
//
// They are accepted nonetheless, for backwards compatibility.
TEST_P(JSONReaderTest, ASCIIControlCodes) {
  const char kRawJson[] = {'"', 'a', '\0', 'b', '\n', 'c', '"'};
  // The explicit length keeps the embedded NUL as part of the input.
  const std::string input(kRawJson, sizeof(kRawJson));
  const absl::optional<Value> parsed = JSONReader::Read(input);
  ASSERT_TRUE(parsed.has_value());
  ASSERT_TRUE(parsed->is_string());
  EXPECT_EQ(5u, parsed->GetString().length());
}
863
// The same document is rejected with a maximum depth of 3 and accepted with a
// maximum depth of 4.
TEST_P(JSONReaderTest, MaxNesting) {
  const std::string kNestedJson = R"({"outer": { "inner": {"foo": true}}})";
  EXPECT_FALSE(JSONReader::Read(kNestedJson, JSON_PARSE_RFC, 3).has_value());
  EXPECT_TRUE(JSONReader::Read(kNestedJson, JSON_PARSE_RFC, 4).has_value());
}
869
TEST_P(JSONReaderTest, Decode4ByteUtf8Char) {
  // kUtf8Data contains a 4 byte unicode character (a smiley!) that JSONReader
  // should be able to handle. The UTF-8 encoding of U+1F607 SMILING FACE WITH
  // HALO is "\xF0\x9F\x98\x87". It is spelled with hex escapes here so that
  // the bytes cannot be lost or altered by the source file's encoding.
  const char kUtf8Data[] =
      "[\"\xF0\x9F\x98\x87\",[],[],[],{\"google:suggesttype\":[]}]";
  absl::optional<Value> root = JSONReader::Read(kUtf8Data, JSON_PARSE_RFC);
  ASSERT_TRUE(root);
  Value::List* list = root->GetIfList();
  ASSERT_TRUE(list);
  ASSERT_EQ(5u, list->size());
  ASSERT_TRUE((*list)[0].is_string());
  // The first list element must round-trip the four UTF-8 bytes unchanged.
  EXPECT_EQ("\xF0\x9F\x98\x87", (*list)[0].GetString());
}
883
TEST_P(JSONReaderTest, DecodeUnicodeNonCharacter) {
  // Unicode code points (encoded as escaped UTF-16) that are not valid
  // characters. Every one of these inputs is expected to parse.
  const char* const kNonCharacterInputs[] = {
      "[\"\\uFDD0\"]",         // U+FDD0
      "[\"\\uFDDF\"]",         // U+FDDF
      "[\"\\uFDEF\"]",         // U+FDEF
      "[\"\\uFFFE\"]",         // U+FFFE
      "[\"\\uFFFF\"]",         // U+FFFF
      "[\"\\uD83F\\uDFFE\"]",  // U+01FFFE
      "[\"\\uD83F\\uDFFF\"]",  // U+01FFFF
      "[\"\\uD87F\\uDFFE\"]",  // U+02FFFE
      "[\"\\uD87F\\uDFFF\"]",  // U+02FFFF
      "[\"\\uD8BF\\uDFFE\"]",  // U+03FFFE
      "[\"\\uD8BF\\uDFFF\"]",  // U+03FFFF
      "[\"\\uD8FF\\uDFFE\"]",  // U+04FFFE
      "[\"\\uD8FF\\uDFFF\"]",  // U+04FFFF
      "[\"\\uD93F\\uDFFE\"]",  // U+05FFFE
      "[\"\\uD93F\\uDFFF\"]",  // U+05FFFF
      "[\"\\uD97F\\uDFFE\"]",  // U+06FFFE
      "[\"\\uD97F\\uDFFF\"]",  // U+06FFFF
      "[\"\\uD9BF\\uDFFE\"]",  // U+07FFFE
      "[\"\\uD9BF\\uDFFF\"]",  // U+07FFFF
      "[\"\\uD9FF\\uDFFE\"]",  // U+08FFFE
      "[\"\\uD9FF\\uDFFF\"]",  // U+08FFFF
      "[\"\\uDA3F\\uDFFE\"]",  // U+09FFFE
      "[\"\\uDA3F\\uDFFF\"]",  // U+09FFFF
      "[\"\\uDA7F\\uDFFE\"]",  // U+0AFFFE
      "[\"\\uDA7F\\uDFFF\"]",  // U+0AFFFF
      "[\"\\uDABF\\uDFFE\"]",  // U+0BFFFE
      "[\"\\uDABF\\uDFFF\"]",  // U+0BFFFF
      "[\"\\uDAFF\\uDFFE\"]",  // U+0CFFFE
      "[\"\\uDAFF\\uDFFF\"]",  // U+0CFFFF
      "[\"\\uDB3F\\uDFFE\"]",  // U+0DFFFE
      "[\"\\uDB3F\\uDFFF\"]",  // U+0DFFFF
      "[\"\\uDB7F\\uDFFE\"]",  // U+0EFFFE
      "[\"\\uDB7F\\uDFFF\"]",  // U+0EFFFF
      "[\"\\uDBBF\\uDFFE\"]",  // U+0FFFFE
      "[\"\\uDBBF\\uDFFF\"]",  // U+0FFFFF
      "[\"\\uDBFF\\uDFFE\"]",  // U+10FFFE
      "[\"\\uDBFF\\uDFFF\"]",  // U+10FFFF
  };

  for (const char* input : kNonCharacterInputs) {
    // Identify the offending input in the failure output.
    SCOPED_TRACE(input);
    EXPECT_TRUE(JSONReader::Read(input).has_value());
  }
}
925
// A minus sign inside a \x or \u escape sequence must make the parse fail.
TEST_P(JSONReaderTest, DecodeNegativeEscapeSequence) {
  const char* const kNegativeEscapes[] = {
      "[\"\\x-A\"]",
      "[\"\\u-00A\"]",
  };

  for (const char* input : kNegativeEscapes) {
    SCOPED_TRACE(input);
    EXPECT_FALSE(JSONReader::Read(input).has_value());
  }
}
930
931 // Verifies invalid code points are replaced.
TEST_P(JSONReaderTest,ReplaceInvalidCharacters)932 TEST_P(JSONReaderTest, ReplaceInvalidCharacters) {
933 // U+D800 is a lone high surrogate.
934 const std::string invalid_high = "\"\xED\xA0\x80\"";
935 absl::optional<Value> value =
936 JSONReader::Read(invalid_high, JSON_REPLACE_INVALID_CHARACTERS);
937 ASSERT_TRUE(value);
938 ASSERT_TRUE(value->is_string());
939 // Expect three U+FFFD (one for each UTF-8 byte in the invalid code point).
940 EXPECT_EQ("\xEF\xBF\xBD\xEF\xBF\xBD\xEF\xBF\xBD", value->GetString());
941
942 // U+DFFF is a lone low surrogate.
943 const std::string invalid_low = "\"\xED\xBF\xBF\"";
944 value = JSONReader::Read(invalid_low, JSON_REPLACE_INVALID_CHARACTERS);
945 ASSERT_TRUE(value);
946 ASSERT_TRUE(value->is_string());
947 // Expect three U+FFFD (one for each UTF-8 byte in the invalid code point).
948 EXPECT_EQ("\xEF\xBF\xBD\xEF\xBF\xBD\xEF\xBF\xBD", value->GetString());
949 }
950
// With JSON_REPLACE_INVALID_CHARACTERS, a \u escape that names a lone
// surrogate is expected to decode to a single U+FFFD, leaving the
// surrounding characters intact.
TEST_P(JSONReaderTest, ReplaceInvalidUTF16EscapeSequence) {
  // "_", U+FFFD, "_".
  const char kUnderscoreReplacementUnderscore[] = "_\xEF\xBF\xBD_";

  const struct {
    const char* description;
    const char* json;
  } kLoneSurrogateEscapes[] = {
      {"U+D800 is a lone high surrogate", "\"_\\uD800_\""},
      {"U+DFFF is a lone low surrogate", "\"_\\uDFFF_\""},
  };

  for (const auto& escape : kLoneSurrogateEscapes) {
    SCOPED_TRACE(escape.description);
    absl::optional<Value> parsed =
        JSONReader::Read(escape.json, JSON_REPLACE_INVALID_CHARACTERS);
    ASSERT_TRUE(parsed.has_value());
    ASSERT_TRUE(parsed->is_string());
    EXPECT_EQ(kUnderscoreReplacementUnderscore, parsed->GetString());
  }
}
967
// Feeds complete and truncated numeric literals to the reader. Each input is
// copied into a buffer without a trailing NUL before parsing. Inputs that
// are expected to parse must yield a number with the listed value.
TEST_P(JSONReaderTest, ParseNumberErrors) {
  const struct {
    const char* input;
    bool parse_success;
    double value;
  } kCases[] = {
      // clang-format off
      {"1", true, 1},
      {"2.", false, 0},
      {"42", true, 42},
      {"6e", false, 0},
      {"43e2", true, 4300},
      {"43e-", false, 0},
      {"9e-3", true, 0.009},
      {"2e+", false, 0},
      {"2e+2", true, 200},
      // clang-format on
  };

  for (unsigned int index = 0; index < std::size(kCases); ++index) {
    const auto& number_case = kCases[index];
    SCOPED_TRACE(StringPrintf("case %u: \"%s\"", index, number_case.input));

    std::unique_ptr<char[]> buffer;
    const StringPiece unterminated_input =
        MakeNotNullTerminatedInput(number_case.input, &buffer);

    const absl::optional<Value> parsed = JSONReader::Read(unterminated_input);
    EXPECT_EQ(number_case.parse_success, parsed.has_value());

    // Only a successful parse has a value to inspect.
    if (parsed.has_value()) {
      ASSERT_TRUE(parsed->is_double() || parsed->is_int());
      EXPECT_EQ(number_case.value, parsed->GetDouble());
    }
  }
}
1005
// Inputs that stop in the middle of a comment, string, container, literal or
// escape sequence. Each one is copied into a buffer without a trailing NUL
// and must fail to parse.
TEST_P(JSONReaderTest, UnterminatedInputs) {
  const char* const kCases[] = {
      // clang-format off
      "/",
      "//",
      "/*",
      "\"xxxxxx",
      "\"",
      "{ ",
      "[\t",
      "tru",
      "fals",
      "nul",
      "\"\\x",
      "\"\\x2",
      "\"\\u123",
      "\"\\uD803\\u",
      "\"\\",
      "\"\\/",
      // clang-format on
  };

  for (unsigned int index = 0; index < std::size(kCases); ++index) {
    const char* const truncated_json = kCases[index];
    SCOPED_TRACE(StringPrintf("case %u: \"%s\"", index, truncated_json));

    std::unique_ptr<char[]> buffer;
    const StringPiece unterminated_input =
        MakeNotNullTerminatedInput(truncated_json, &buffer);

    EXPECT_FALSE(JSONReader::Read(unterminated_input).has_value());
  }
}
1038
// Checks the line and column reported for a parse error. Every input is
// invalid; the table lists where the error is expected to be reported.
TEST_P(JSONReaderTest, LineColumnCounting) {
  const struct {
    const char* input;
    int error_line;
    int error_column;
  } kCases[] = {
      // For all but the "q_is_not_etc" case, the error (indicated by ^ in the
      // comments) is seeing a digit when expecting ',' or ']'.
      {
          // Line and column counts are 1-based, not 0-based.
          "q_is_not_the_start_of_any_valid_JSON_token",
          1,
          1,
      },
      {
          "[2,4,6 8",
          // -----^
          1,
          8,
      },
      {
          "[2,4,6\t8",
          // ------^
          1,
          8,
      },
      {
          "[2,4,6\n8",
          // ------^
          2,
          1,
      },
      {
          "[\n0,\n1,\n2,\n3,4,5,6 7,\n8,\n9\n]",
          // ---------------------^
          5,
          9,
      },
      {
          // Same as the previous example, but with "\r\n"s instead of "\n"s.
          "[\r\n0,\r\n1,\r\n2,\r\n3,4,5,6 7,\r\n8,\r\n9\r\n]",
          // -----------------------------^
          5,
          9,
      },
      // The JSON spec forbids unescaped ASCII control characters (including
      // line breaks) within a string, but our implementation is more lenient.
      {
          "[\"3\n1\" 4",
          // --------^
          2,
          4,
      },
      {
          "[\"3\r\n1\" 4",
          // ----------^
          2,
          4,
      },
  };

  for (unsigned int i = 0; i < std::size(kCases); ++i) {
    const auto& test_case = kCases[i];
    SCOPED_TRACE(StringPrintf("case %u: \"%s\"", i, test_case.input));

    auto root = JSONReader::ReadAndReturnValueWithError(
        test_case.input, JSON_PARSE_RFC | JSON_ALLOW_CONTROL_CHARS);
    // error() may only be queried when no value is held, so an unexpected
    // success is reported explicitly and the remaining cases still run.
    if (root.has_value()) {
      ADD_FAILURE() << "Expected a parse error, but the input was accepted";
      continue;
    }
    EXPECT_EQ(test_case.error_line, root.error().line);
    EXPECT_EQ(test_case.error_column, root.error().column);
  }
}
1111
TEST_P(JSONReaderTest, ChromiumExtensions) {
  // Each input below relies on exactly one extension: it must be rejected by
  // JSON_PARSE_RFC and accepted by JSON_PARSE_CHROMIUM_EXTENSIONS.
  const struct {
    // The JSON input.
    const char* input;
    // What JSON_* option permits this extension.
    int option;
  } kCases[] = {
      {"{ /* comment */ \"foo\": 3 }", JSON_ALLOW_COMMENTS},
      {"{ // comment\n \"foo\": 3 }", JSON_ALLOW_COMMENTS},
      {"[\"\\xAB\"]", JSON_ALLOW_X_ESCAPES},
      {"[\"\b\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\f\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\n\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\r\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\t\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\v\"]", JSON_ALLOW_CONTROL_CHARS},
      {"[\"\\v\"]", JSON_ALLOW_VERT_TAB},
  };

  for (size_t index = 0; index < std::size(kCases); ++index) {
    SCOPED_TRACE(testing::Message() << "case " << index);
    const auto& extension_case = kCases[index];

    // Reports whether the current input parses under |options|.
    const auto parses_with = [&extension_case](int options) {
      return JSONReader::ReadAndReturnValueWithError(extension_case.input,
                                                     options)
          .has_value();
    };

    // Strict RFC parsing rejects the input...
    EXPECT_FALSE(parses_with(JSON_PARSE_RFC));
    // ...enabling just the one relevant option is enough to accept it...
    EXPECT_TRUE(parses_with(JSON_PARSE_RFC | extension_case.option));
    // ...as is enabling every Chromium extension...
    EXPECT_TRUE(parses_with(JSON_PARSE_CHROMIUM_EXTENSIONS));
    // ...but removing that one option from the full set rejects it again.
    EXPECT_FALSE(
        parses_with(JSON_PARSE_CHROMIUM_EXTENSIONS & ~extension_case.option));
  }
}
1154
// The reader must report the same Rust-parser state that the fixture
// configured through its feature list.
TEST_P(JSONReaderTest, UsingRust) {
  const bool reader_reports_rust = JSONReader::UsingRust();
  ASSERT_EQ(reader_reports_rust, using_rust_);
}
1158
1159 INSTANTIATE_TEST_SUITE_P(All,
1160 JSONReaderTest,
1161 #if BUILDFLAG(BUILD_RUST_JSON_READER)
1162 testing::Bool(),
1163 #else // BUILDFLAG(BUILD_RUST_JSON_READER)
1164 testing::Values(false),
1165 #endif // BUILDFLAG(BUILD_RUST_JSON_READER)
__anonc1092b710502(const testing::TestParamInfo<bool>& info) 1166 [](const testing::TestParamInfo<bool>& info) {
1167 return info.param ? "Rust" : "Cpp";
1168 });
1169
1170 } // namespace base
1171