1 // Copyright 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "components/policy/core/common/schema.h"
6
7 #include <algorithm>
8 #include <climits>
9 #include <map>
10 #include <utility>
11
12 #include "base/compiler_specific.h"
13 #include "base/logging.h"
14 #include "base/memory/scoped_ptr.h"
15 #include "base/memory/scoped_vector.h"
16 #include "base/stl_util.h"
17 #include "base/strings/stringprintf.h"
18 #include "components/json_schema/json_schema_constants.h"
19 #include "components/json_schema/json_schema_validator.h"
20 #include "components/policy/core/common/schema_internal.h"
21 #include "third_party/re2/re2/re2.h"
22
23 namespace schema = json_schema_constants;
24
25 namespace policy {
26
27 using internal::PropertiesNode;
28 using internal::PropertyNode;
29 using internal::RestrictionNode;
30 using internal::SchemaData;
31 using internal::SchemaNode;
32
33 namespace {
34
35 // Maps schema "id" attributes to the corresponding SchemaNode index.
36 typedef std::map<std::string, int> IdMap;
37
38 // List of pairs of references to be assigned later. The string is the "id"
39 // whose corresponding index should be stored in the pointer, once all the IDs
40 // are available.
41 typedef std::vector<std::pair<std::string, int*> > ReferenceList;
42
43 // Sizes for the storage arrays. These are calculated in advance so that the
44 // arrays don't have to be resized during parsing, which would invalidate
45 // pointers into their contents (i.e. string's c_str() and address of indices
46 // for "$ref" attributes).
47 struct StorageSizes {
StorageSizespolicy::__anonb5a8514b0111::StorageSizes48 StorageSizes()
49 : strings(0), schema_nodes(0), property_nodes(0), properties_nodes(0),
50 restriction_nodes(0), int_enums(0), string_enums(0) { }
51 size_t strings;
52 size_t schema_nodes;
53 size_t property_nodes;
54 size_t properties_nodes;
55 size_t restriction_nodes;
56 size_t int_enums;
57 size_t string_enums;
58 };
59
60 // An invalid index, indicating that a node is not present; similar to a NULL
61 // pointer.
62 const int kInvalid = -1;
63
SchemaTypeToValueType(const std::string & type_string,base::Value::Type * type)64 bool SchemaTypeToValueType(const std::string& type_string,
65 base::Value::Type* type) {
66 // Note: "any" is not an accepted type.
67 static const struct {
68 const char* schema_type;
69 base::Value::Type value_type;
70 } kSchemaToValueTypeMap[] = {
71 { schema::kArray, base::Value::TYPE_LIST },
72 { schema::kBoolean, base::Value::TYPE_BOOLEAN },
73 { schema::kInteger, base::Value::TYPE_INTEGER },
74 { schema::kNull, base::Value::TYPE_NULL },
75 { schema::kNumber, base::Value::TYPE_DOUBLE },
76 { schema::kObject, base::Value::TYPE_DICTIONARY },
77 { schema::kString, base::Value::TYPE_STRING },
78 };
79 for (size_t i = 0; i < ARRAYSIZE_UNSAFE(kSchemaToValueTypeMap); ++i) {
80 if (kSchemaToValueTypeMap[i].schema_type == type_string) {
81 *type = kSchemaToValueTypeMap[i].value_type;
82 return true;
83 }
84 }
85 return false;
86 }
87
StrategyAllowInvalidOnTopLevel(SchemaOnErrorStrategy strategy)88 bool StrategyAllowInvalidOnTopLevel(SchemaOnErrorStrategy strategy) {
89 return strategy == SCHEMA_ALLOW_INVALID ||
90 strategy == SCHEMA_ALLOW_INVALID_TOPLEVEL ||
91 strategy == SCHEMA_ALLOW_INVALID_TOPLEVEL_AND_ALLOW_UNKNOWN;
92 }
93
StrategyAllowUnknownOnTopLevel(SchemaOnErrorStrategy strategy)94 bool StrategyAllowUnknownOnTopLevel(SchemaOnErrorStrategy strategy) {
95 return strategy != SCHEMA_STRICT;
96 }
97
StrategyForNextLevel(SchemaOnErrorStrategy strategy)98 SchemaOnErrorStrategy StrategyForNextLevel(SchemaOnErrorStrategy strategy) {
99 static SchemaOnErrorStrategy next_level_strategy[] = {
100 SCHEMA_STRICT, // SCHEMA_STRICT
101 SCHEMA_STRICT, // SCHEMA_ALLOW_UNKNOWN_TOPLEVEL
102 SCHEMA_ALLOW_UNKNOWN, // SCHEMA_ALLOW_UNKNOWN
103 SCHEMA_STRICT, // SCHEMA_ALLOW_INVALID_TOPLEVEL
104 SCHEMA_ALLOW_UNKNOWN, // SCHEMA_ALLOW_INVALID_TOPLEVEL_AND_ALLOW_UNKNOWN
105 SCHEMA_ALLOW_INVALID, // SCHEMA_ALLOW_INVALID
106 };
107 return next_level_strategy[(int)strategy];
108 }
109
SchemaErrorFound(std::string * error_path,std::string * error,const std::string & msg)110 void SchemaErrorFound(std::string* error_path,
111 std::string* error,
112 const std::string& msg) {
113 if (error_path)
114 *error_path = "";
115 *error = msg;
116 }
117
AddListIndexPrefixToPath(int index,std::string * path)118 void AddListIndexPrefixToPath(int index, std::string* path) {
119 if (path) {
120 if (path->empty())
121 *path = base::StringPrintf("items[%d]", index);
122 else
123 *path = base::StringPrintf("items[%d].", index) + *path;
124 }
125 }
126
AddDictKeyPrefixToPath(const std::string & key,std::string * path)127 void AddDictKeyPrefixToPath(const std::string& key, std::string* path) {
128 if (path) {
129 if (path->empty())
130 *path = key;
131 else
132 *path = key + "." + *path;
133 }
134 }
135
136 } // namespace
137
138 // Contains the internal data representation of a Schema. This can either wrap
139 // a SchemaData owned elsewhere (currently used to wrap the Chrome schema, which
140 // is generated at compile time), or it can own its own SchemaData.
141 class Schema::InternalStorage
142 : public base::RefCountedThreadSafe<InternalStorage> {
143 public:
144 static scoped_refptr<const InternalStorage> Wrap(const SchemaData* data);
145
146 static scoped_refptr<const InternalStorage> ParseSchema(
147 const base::DictionaryValue& schema,
148 std::string* error);
149
data() const150 const SchemaData* data() const { return &schema_data_; }
151
root_node() const152 const SchemaNode* root_node() const {
153 return schema(0);
154 }
155
schema(int index) const156 const SchemaNode* schema(int index) const {
157 return schema_data_.schema_nodes + index;
158 }
159
properties(int index) const160 const PropertiesNode* properties(int index) const {
161 return schema_data_.properties_nodes + index;
162 }
163
property(int index) const164 const PropertyNode* property(int index) const {
165 return schema_data_.property_nodes + index;
166 }
167
restriction(int index) const168 const RestrictionNode* restriction(int index) const {
169 return schema_data_.restriction_nodes + index;
170 }
171
int_enums(int index) const172 const int* int_enums(int index) const {
173 return schema_data_.int_enums + index;
174 }
175
string_enums(int index) const176 const char** string_enums(int index) const {
177 return schema_data_.string_enums + index;
178 }
179
180 // Compiles regular expression |pattern|. The result is cached and will be
181 // returned directly next time.
182 re2::RE2* CompileRegex(const std::string& pattern) const;
183
184 private:
185 friend class base::RefCountedThreadSafe<InternalStorage>;
186
187 InternalStorage();
188 ~InternalStorage();
189
190 // Determines the expected |sizes| of the storage for the representation
191 // of |schema|.
192 static void DetermineStorageSizes(const base::DictionaryValue& schema,
193 StorageSizes* sizes);
194
195 // Parses the JSON schema in |schema|.
196 //
197 // If |schema| has a "$ref" attribute then a pending reference is appended
198 // to the |reference_list|, and nothing else is done.
199 //
200 // Otherwise, |index| gets assigned the index of the corresponding SchemaNode
201 // in |schema_nodes_|. If the |schema| contains an "id" then that ID is mapped
202 // to the |index| in the |id_map|.
203 //
204 // If |schema| is invalid then |error| gets the error reason and false is
205 // returned. Otherwise returns true.
206 bool Parse(const base::DictionaryValue& schema,
207 int* index,
208 IdMap* id_map,
209 ReferenceList* reference_list,
210 std::string* error);
211
212 // Helper for Parse() that gets an already assigned |schema_node| instead of
213 // an |index| pointer.
214 bool ParseDictionary(const base::DictionaryValue& schema,
215 SchemaNode* schema_node,
216 IdMap* id_map,
217 ReferenceList* reference_list,
218 std::string* error);
219
220 // Helper for Parse() that gets an already assigned |schema_node| instead of
221 // an |index| pointer.
222 bool ParseList(const base::DictionaryValue& schema,
223 SchemaNode* schema_node,
224 IdMap* id_map,
225 ReferenceList* reference_list,
226 std::string* error);
227
228 bool ParseEnum(const base::DictionaryValue& schema,
229 base::Value::Type type,
230 SchemaNode* schema_node,
231 std::string* error);
232
233 bool ParseRangedInt(const base::DictionaryValue& schema,
234 SchemaNode* schema_node,
235 std::string* error);
236
237 bool ParseStringPattern(const base::DictionaryValue& schema,
238 SchemaNode* schema_node,
239 std::string* error);
240
241 // Assigns the IDs in |id_map| to the pending references in the
242 // |reference_list|. If an ID is missing then |error| is set and false is
243 // returned; otherwise returns true.
244 static bool ResolveReferences(const IdMap& id_map,
245 const ReferenceList& reference_list,
246 std::string* error);
247
248 // Cache for CompileRegex(), will memorize return value of every call to
249 // CompileRegex() and return results directly next time.
250 mutable std::map<std::string, re2::RE2*> regex_cache_;
251 STLValueDeleter<std::map<std::string, re2::RE2*> > regex_cache_deleter_;
252
253 SchemaData schema_data_;
254 std::vector<std::string> strings_;
255 std::vector<SchemaNode> schema_nodes_;
256 std::vector<PropertyNode> property_nodes_;
257 std::vector<PropertiesNode> properties_nodes_;
258 std::vector<RestrictionNode> restriction_nodes_;
259 std::vector<int> int_enums_;
260 std::vector<const char*> string_enums_;
261
262 DISALLOW_COPY_AND_ASSIGN(InternalStorage);
263 };
264
InternalStorage()265 Schema::InternalStorage::InternalStorage()
266 : regex_cache_deleter_(®ex_cache_) {}
267
~InternalStorage()268 Schema::InternalStorage::~InternalStorage() {}
269
270 // static
Wrap(const SchemaData * data)271 scoped_refptr<const Schema::InternalStorage> Schema::InternalStorage::Wrap(
272 const SchemaData* data) {
273 InternalStorage* storage = new InternalStorage();
274 storage->schema_data_.schema_nodes = data->schema_nodes;
275 storage->schema_data_.property_nodes = data->property_nodes;
276 storage->schema_data_.properties_nodes = data->properties_nodes;
277 storage->schema_data_.restriction_nodes = data->restriction_nodes;
278 storage->schema_data_.int_enums = data->int_enums;
279 storage->schema_data_.string_enums = data->string_enums;
280 return storage;
281 }
282
283 // static
284 scoped_refptr<const Schema::InternalStorage>
ParseSchema(const base::DictionaryValue & schema,std::string * error)285 Schema::InternalStorage::ParseSchema(const base::DictionaryValue& schema,
286 std::string* error) {
287 // Determine the sizes of the storage arrays and reserve the capacity before
288 // starting to append nodes and strings. This is important to prevent the
289 // arrays from being reallocated, which would invalidate the c_str() pointers
290 // and the addresses of indices to fix.
291 StorageSizes sizes;
292 DetermineStorageSizes(schema, &sizes);
293
294 scoped_refptr<InternalStorage> storage = new InternalStorage();
295 storage->strings_.reserve(sizes.strings);
296 storage->schema_nodes_.reserve(sizes.schema_nodes);
297 storage->property_nodes_.reserve(sizes.property_nodes);
298 storage->properties_nodes_.reserve(sizes.properties_nodes);
299 storage->restriction_nodes_.reserve(sizes.restriction_nodes);
300 storage->int_enums_.reserve(sizes.int_enums);
301 storage->string_enums_.reserve(sizes.string_enums);
302
303 int root_index = kInvalid;
304 IdMap id_map;
305 ReferenceList reference_list;
306 if (!storage->Parse(schema, &root_index, &id_map, &reference_list, error))
307 return NULL;
308
309 if (root_index == kInvalid) {
310 *error = "The main schema can't have a $ref";
311 return NULL;
312 }
313
314 // None of this should ever happen without having been already detected.
315 // But, if it does happen, then it will lead to corrupted memory; drop
316 // everything in that case.
317 if (root_index != 0 ||
318 sizes.strings != storage->strings_.size() ||
319 sizes.schema_nodes != storage->schema_nodes_.size() ||
320 sizes.property_nodes != storage->property_nodes_.size() ||
321 sizes.properties_nodes != storage->properties_nodes_.size() ||
322 sizes.restriction_nodes != storage->restriction_nodes_.size() ||
323 sizes.int_enums != storage->int_enums_.size() ||
324 sizes.string_enums != storage->string_enums_.size()) {
325 *error = "Failed to parse the schema due to a Chrome bug. Please file a "
326 "new issue at http://crbug.com";
327 return NULL;
328 }
329
330 if (!ResolveReferences(id_map, reference_list, error))
331 return NULL;
332
333 SchemaData* data = &storage->schema_data_;
334 data->schema_nodes = vector_as_array(&storage->schema_nodes_);
335 data->property_nodes = vector_as_array(&storage->property_nodes_);
336 data->properties_nodes = vector_as_array(&storage->properties_nodes_);
337 data->restriction_nodes = vector_as_array(&storage->restriction_nodes_);
338 data->int_enums = vector_as_array(&storage->int_enums_);
339 data->string_enums = vector_as_array(&storage->string_enums_);
340 return storage;
341 }
342
CompileRegex(const std::string & pattern) const343 re2::RE2* Schema::InternalStorage::CompileRegex(
344 const std::string& pattern) const {
345 std::map<std::string, re2::RE2*>::iterator it = regex_cache_.find(pattern);
346 if (it == regex_cache_.end()) {
347 re2::RE2* compiled = new re2::RE2(pattern);
348 regex_cache_[pattern] = compiled;
349 return compiled;
350 }
351 return it->second;
352 }
353
354 // static
DetermineStorageSizes(const base::DictionaryValue & schema,StorageSizes * sizes)355 void Schema::InternalStorage::DetermineStorageSizes(
356 const base::DictionaryValue& schema,
357 StorageSizes* sizes) {
358 std::string ref_string;
359 if (schema.GetString(schema::kRef, &ref_string)) {
360 // Schemas with a "$ref" attribute don't take additional storage.
361 return;
362 }
363
364 std::string type_string;
365 base::Value::Type type = base::Value::TYPE_NULL;
366 if (!schema.GetString(schema::kType, &type_string) ||
367 !SchemaTypeToValueType(type_string, &type)) {
368 // This schema is invalid.
369 return;
370 }
371
372 sizes->schema_nodes++;
373
374 if (type == base::Value::TYPE_LIST) {
375 const base::DictionaryValue* items = NULL;
376 if (schema.GetDictionary(schema::kItems, &items))
377 DetermineStorageSizes(*items, sizes);
378 } else if (type == base::Value::TYPE_DICTIONARY) {
379 sizes->properties_nodes++;
380
381 const base::DictionaryValue* dict = NULL;
382 if (schema.GetDictionary(schema::kAdditionalProperties, &dict))
383 DetermineStorageSizes(*dict, sizes);
384
385 const base::DictionaryValue* properties = NULL;
386 if (schema.GetDictionary(schema::kProperties, &properties)) {
387 for (base::DictionaryValue::Iterator it(*properties);
388 !it.IsAtEnd(); it.Advance()) {
389 // This should have been verified by the JSONSchemaValidator.
390 CHECK(it.value().GetAsDictionary(&dict));
391 DetermineStorageSizes(*dict, sizes);
392 sizes->strings++;
393 sizes->property_nodes++;
394 }
395 }
396
397 const base::DictionaryValue* pattern_properties = NULL;
398 if (schema.GetDictionary(schema::kPatternProperties, &pattern_properties)) {
399 for (base::DictionaryValue::Iterator it(*pattern_properties);
400 !it.IsAtEnd(); it.Advance()) {
401 CHECK(it.value().GetAsDictionary(&dict));
402 DetermineStorageSizes(*dict, sizes);
403 sizes->strings++;
404 sizes->property_nodes++;
405 }
406 }
407 } else if (schema.HasKey(schema::kEnum)) {
408 const base::ListValue* possible_values = NULL;
409 if (schema.GetList(schema::kEnum, &possible_values)) {
410 if (type == base::Value::TYPE_INTEGER) {
411 sizes->int_enums += possible_values->GetSize();
412 } else if (type == base::Value::TYPE_STRING) {
413 sizes->string_enums += possible_values->GetSize();
414 sizes->strings += possible_values->GetSize();
415 }
416 sizes->restriction_nodes++;
417 }
418 } else if (type == base::Value::TYPE_INTEGER) {
419 if (schema.HasKey(schema::kMinimum) || schema.HasKey(schema::kMaximum))
420 sizes->restriction_nodes++;
421 } else if (type == base::Value::TYPE_STRING) {
422 if (schema.HasKey(schema::kPattern)) {
423 sizes->strings++;
424 sizes->string_enums++;
425 sizes->restriction_nodes++;
426 }
427 }
428 }
429
Parse(const base::DictionaryValue & schema,int * index,IdMap * id_map,ReferenceList * reference_list,std::string * error)430 bool Schema::InternalStorage::Parse(const base::DictionaryValue& schema,
431 int* index,
432 IdMap* id_map,
433 ReferenceList* reference_list,
434 std::string* error) {
435 std::string ref_string;
436 if (schema.GetString(schema::kRef, &ref_string)) {
437 std::string id_string;
438 if (schema.GetString(schema::kId, &id_string)) {
439 *error = "Schemas with a $ref can't have an id";
440 return false;
441 }
442 reference_list->push_back(std::make_pair(ref_string, index));
443 return true;
444 }
445
446 std::string type_string;
447 if (!schema.GetString(schema::kType, &type_string)) {
448 *error = "The schema type must be declared.";
449 return false;
450 }
451
452 base::Value::Type type = base::Value::TYPE_NULL;
453 if (!SchemaTypeToValueType(type_string, &type)) {
454 *error = "Type not supported: " + type_string;
455 return false;
456 }
457
458 *index = static_cast<int>(schema_nodes_.size());
459 schema_nodes_.push_back(SchemaNode());
460 SchemaNode* schema_node = &schema_nodes_.back();
461 schema_node->type = type;
462 schema_node->extra = kInvalid;
463
464 if (type == base::Value::TYPE_DICTIONARY) {
465 if (!ParseDictionary(schema, schema_node, id_map, reference_list, error))
466 return false;
467 } else if (type == base::Value::TYPE_LIST) {
468 if (!ParseList(schema, schema_node, id_map, reference_list, error))
469 return false;
470 } else if (schema.HasKey(schema::kEnum)) {
471 if (!ParseEnum(schema, type, schema_node, error))
472 return false;
473 } else if (schema.HasKey(schema::kPattern)) {
474 if (!ParseStringPattern(schema, schema_node, error))
475 return false;
476 } else if (schema.HasKey(schema::kMinimum) ||
477 schema.HasKey(schema::kMaximum)) {
478 if (type != base::Value::TYPE_INTEGER) {
479 *error = "Only integers can have minimum and maximum";
480 return false;
481 }
482 if (!ParseRangedInt(schema, schema_node, error))
483 return false;
484 }
485 std::string id_string;
486 if (schema.GetString(schema::kId, &id_string)) {
487 if (ContainsKey(*id_map, id_string)) {
488 *error = "Duplicated id: " + id_string;
489 return false;
490 }
491 (*id_map)[id_string] = *index;
492 }
493
494 return true;
495 }
496
ParseDictionary(const base::DictionaryValue & schema,SchemaNode * schema_node,IdMap * id_map,ReferenceList * reference_list,std::string * error)497 bool Schema::InternalStorage::ParseDictionary(
498 const base::DictionaryValue& schema,
499 SchemaNode* schema_node,
500 IdMap* id_map,
501 ReferenceList* reference_list,
502 std::string* error) {
503 int extra = static_cast<int>(properties_nodes_.size());
504 properties_nodes_.push_back(PropertiesNode());
505 properties_nodes_[extra].additional = kInvalid;
506 schema_node->extra = extra;
507
508 const base::DictionaryValue* dict = NULL;
509 if (schema.GetDictionary(schema::kAdditionalProperties, &dict)) {
510 if (!Parse(*dict, &properties_nodes_[extra].additional,
511 id_map, reference_list, error)) {
512 return false;
513 }
514 }
515
516 properties_nodes_[extra].begin = static_cast<int>(property_nodes_.size());
517
518 const base::DictionaryValue* properties = NULL;
519 if (schema.GetDictionary(schema::kProperties, &properties)) {
520 // This and below reserves nodes for all of the |properties|, and makes sure
521 // they are contiguous. Recursive calls to Parse() will append after these
522 // elements.
523 property_nodes_.resize(property_nodes_.size() + properties->size());
524 }
525
526 properties_nodes_[extra].end = static_cast<int>(property_nodes_.size());
527
528 const base::DictionaryValue* pattern_properties = NULL;
529 if (schema.GetDictionary(schema::kPatternProperties, &pattern_properties))
530 property_nodes_.resize(property_nodes_.size() + pattern_properties->size());
531
532 properties_nodes_[extra].pattern_end =
533 static_cast<int>(property_nodes_.size());
534
535 if (properties != NULL) {
536 int base_index = properties_nodes_[extra].begin;
537 int index = base_index;
538
539 for (base::DictionaryValue::Iterator it(*properties);
540 !it.IsAtEnd(); it.Advance(), ++index) {
541 // This should have been verified by the JSONSchemaValidator.
542 CHECK(it.value().GetAsDictionary(&dict));
543 strings_.push_back(it.key());
544 property_nodes_[index].key = strings_.back().c_str();
545 if (!Parse(*dict, &property_nodes_[index].schema,
546 id_map, reference_list, error)) {
547 return false;
548 }
549 }
550 CHECK_EQ(static_cast<int>(properties->size()), index - base_index);
551 }
552
553 if (pattern_properties != NULL) {
554 int base_index = properties_nodes_[extra].end;
555 int index = base_index;
556
557 for (base::DictionaryValue::Iterator it(*pattern_properties);
558 !it.IsAtEnd(); it.Advance(), ++index) {
559 CHECK(it.value().GetAsDictionary(&dict));
560 re2::RE2* compiled_regex = CompileRegex(it.key());
561 if (!compiled_regex->ok()) {
562 *error =
563 "/" + it.key() + "/ is a invalid regex: " + compiled_regex->error();
564 return false;
565 }
566 strings_.push_back(it.key());
567 property_nodes_[index].key = strings_.back().c_str();
568 if (!Parse(*dict, &property_nodes_[index].schema,
569 id_map, reference_list, error)) {
570 return false;
571 }
572 }
573 CHECK_EQ(static_cast<int>(pattern_properties->size()), index - base_index);
574 }
575
576 if (properties_nodes_[extra].begin == properties_nodes_[extra].pattern_end) {
577 properties_nodes_[extra].begin = kInvalid;
578 properties_nodes_[extra].end = kInvalid;
579 properties_nodes_[extra].pattern_end = kInvalid;
580 }
581
582 return true;
583 }
584
ParseList(const base::DictionaryValue & schema,SchemaNode * schema_node,IdMap * id_map,ReferenceList * reference_list,std::string * error)585 bool Schema::InternalStorage::ParseList(const base::DictionaryValue& schema,
586 SchemaNode* schema_node,
587 IdMap* id_map,
588 ReferenceList* reference_list,
589 std::string* error) {
590 const base::DictionaryValue* dict = NULL;
591 if (!schema.GetDictionary(schema::kItems, &dict)) {
592 *error = "Arrays must declare a single schema for their items.";
593 return false;
594 }
595 return Parse(*dict, &schema_node->extra, id_map, reference_list, error);
596 }
597
ParseEnum(const base::DictionaryValue & schema,base::Value::Type type,SchemaNode * schema_node,std::string * error)598 bool Schema::InternalStorage::ParseEnum(const base::DictionaryValue& schema,
599 base::Value::Type type,
600 SchemaNode* schema_node,
601 std::string* error) {
602 const base::ListValue *possible_values = NULL;
603 if (!schema.GetList(schema::kEnum, &possible_values)) {
604 *error = "Enum attribute must be a list value";
605 return false;
606 }
607 if (possible_values->empty()) {
608 *error = "Enum attribute must be non-empty";
609 return false;
610 }
611 int offset_begin;
612 int offset_end;
613 if (type == base::Value::TYPE_INTEGER) {
614 offset_begin = static_cast<int>(int_enums_.size());
615 int value;
616 for (base::ListValue::const_iterator it = possible_values->begin();
617 it != possible_values->end(); ++it) {
618 if (!(*it)->GetAsInteger(&value)) {
619 *error = "Invalid enumeration member type";
620 return false;
621 }
622 int_enums_.push_back(value);
623 }
624 offset_end = static_cast<int>(int_enums_.size());
625 } else if (type == base::Value::TYPE_STRING) {
626 offset_begin = static_cast<int>(string_enums_.size());
627 std::string value;
628 for (base::ListValue::const_iterator it = possible_values->begin();
629 it != possible_values->end(); ++it) {
630 if (!(*it)->GetAsString(&value)) {
631 *error = "Invalid enumeration member type";
632 return false;
633 }
634 strings_.push_back(value);
635 string_enums_.push_back(strings_.back().c_str());
636 }
637 offset_end = static_cast<int>(string_enums_.size());
638 } else {
639 *error = "Enumeration is only supported for integer and string.";
640 return false;
641 }
642 schema_node->extra = static_cast<int>(restriction_nodes_.size());
643 restriction_nodes_.push_back(RestrictionNode());
644 restriction_nodes_.back().enumeration_restriction.offset_begin = offset_begin;
645 restriction_nodes_.back().enumeration_restriction.offset_end = offset_end;
646 return true;
647 }
648
ParseRangedInt(const base::DictionaryValue & schema,SchemaNode * schema_node,std::string * error)649 bool Schema::InternalStorage::ParseRangedInt(
650 const base::DictionaryValue& schema,
651 SchemaNode* schema_node,
652 std::string* error) {
653 int min_value = INT_MIN;
654 int max_value = INT_MAX;
655 int value;
656 if (schema.GetInteger(schema::kMinimum, &value))
657 min_value = value;
658 if (schema.GetInteger(schema::kMaximum, &value))
659 max_value = value;
660 if (min_value > max_value) {
661 *error = "Invalid range restriction for int type.";
662 return false;
663 }
664 schema_node->extra = static_cast<int>(restriction_nodes_.size());
665 restriction_nodes_.push_back(RestrictionNode());
666 restriction_nodes_.back().ranged_restriction.max_value = max_value;
667 restriction_nodes_.back().ranged_restriction.min_value = min_value;
668 return true;
669 }
670
ParseStringPattern(const base::DictionaryValue & schema,SchemaNode * schema_node,std::string * error)671 bool Schema::InternalStorage::ParseStringPattern(
672 const base::DictionaryValue& schema,
673 SchemaNode* schema_node,
674 std::string* error) {
675 std::string pattern;
676 if (!schema.GetString(schema::kPattern, &pattern)) {
677 *error = "Schema pattern must be a string.";
678 return false;
679 }
680 re2::RE2* compiled_regex = CompileRegex(pattern);
681 if (!compiled_regex->ok()) {
682 *error = "/" + pattern + "/ is invalid regex: " + compiled_regex->error();
683 return false;
684 }
685 int index = static_cast<int>(string_enums_.size());
686 strings_.push_back(pattern);
687 string_enums_.push_back(strings_.back().c_str());
688 schema_node->extra = static_cast<int>(restriction_nodes_.size());
689 restriction_nodes_.push_back(RestrictionNode());
690 restriction_nodes_.back().string_pattern_restriction.pattern_index = index;
691 restriction_nodes_.back().string_pattern_restriction.pattern_index_backup =
692 index;
693 return true;
694 }
695
696 // static
ResolveReferences(const IdMap & id_map,const ReferenceList & reference_list,std::string * error)697 bool Schema::InternalStorage::ResolveReferences(
698 const IdMap& id_map,
699 const ReferenceList& reference_list,
700 std::string* error) {
701 for (ReferenceList::const_iterator ref = reference_list.begin();
702 ref != reference_list.end(); ++ref) {
703 IdMap::const_iterator id = id_map.find(ref->first);
704 if (id == id_map.end()) {
705 *error = "Invalid $ref: " + ref->first;
706 return false;
707 }
708 *ref->second = id->second;
709 }
710 return true;
711 }
712
Iterator(const scoped_refptr<const InternalStorage> & storage,const PropertiesNode * node)713 Schema::Iterator::Iterator(const scoped_refptr<const InternalStorage>& storage,
714 const PropertiesNode* node)
715 : storage_(storage),
716 it_(storage->property(node->begin)),
717 end_(storage->property(node->end)) {}
718
Iterator(const Iterator & iterator)719 Schema::Iterator::Iterator(const Iterator& iterator)
720 : storage_(iterator.storage_),
721 it_(iterator.it_),
722 end_(iterator.end_) {}
723
~Iterator()724 Schema::Iterator::~Iterator() {}
725
operator =(const Iterator & iterator)726 Schema::Iterator& Schema::Iterator::operator=(const Iterator& iterator) {
727 storage_ = iterator.storage_;
728 it_ = iterator.it_;
729 end_ = iterator.end_;
730 return *this;
731 }
732
IsAtEnd() const733 bool Schema::Iterator::IsAtEnd() const {
734 return it_ == end_;
735 }
736
Advance()737 void Schema::Iterator::Advance() {
738 ++it_;
739 }
740
key() const741 const char* Schema::Iterator::key() const {
742 return it_->key;
743 }
744
schema() const745 Schema Schema::Iterator::schema() const {
746 return Schema(storage_, storage_->schema(it_->schema));
747 }
748
Schema()749 Schema::Schema() : node_(NULL) {}
750
Schema(const scoped_refptr<const InternalStorage> & storage,const SchemaNode * node)751 Schema::Schema(const scoped_refptr<const InternalStorage>& storage,
752 const SchemaNode* node)
753 : storage_(storage), node_(node) {}
754
Schema(const Schema & schema)755 Schema::Schema(const Schema& schema)
756 : storage_(schema.storage_), node_(schema.node_) {}
757
~Schema()758 Schema::~Schema() {}
759
operator =(const Schema & schema)760 Schema& Schema::operator=(const Schema& schema) {
761 storage_ = schema.storage_;
762 node_ = schema.node_;
763 return *this;
764 }
765
766 // static
Wrap(const SchemaData * data)767 Schema Schema::Wrap(const SchemaData* data) {
768 scoped_refptr<const InternalStorage> storage = InternalStorage::Wrap(data);
769 return Schema(storage, storage->root_node());
770 }
771
Validate(const base::Value & value,SchemaOnErrorStrategy strategy,std::string * error_path,std::string * error) const772 bool Schema::Validate(const base::Value& value,
773 SchemaOnErrorStrategy strategy,
774 std::string* error_path,
775 std::string* error) const {
776 if (!valid()) {
777 SchemaErrorFound(error_path, error, "The schema is invalid.");
778 return false;
779 }
780
781 if (!value.IsType(type())) {
782 // Allow the integer to double promotion. Note that range restriction on
783 // double is not supported now.
784 if (value.IsType(base::Value::TYPE_INTEGER) &&
785 type() == base::Value::TYPE_DOUBLE) {
786 return true;
787 }
788
789 SchemaErrorFound(
790 error_path, error, "The value type doesn't match the schema type.");
791 return false;
792 }
793
794 const base::DictionaryValue* dict = NULL;
795 const base::ListValue* list = NULL;
796 int int_value;
797 std::string str_value;
798 if (value.GetAsDictionary(&dict)) {
799 for (base::DictionaryValue::Iterator it(*dict); !it.IsAtEnd();
800 it.Advance()) {
801 SchemaList schema_list = GetMatchingProperties(it.key());
802 if (schema_list.empty()) {
803 // Unknown property was detected.
804 SchemaErrorFound(error_path, error, "Unknown property: " + it.key());
805 if (!StrategyAllowUnknownOnTopLevel(strategy))
806 return false;
807 } else {
808 for (SchemaList::iterator subschema = schema_list.begin();
809 subschema != schema_list.end(); ++subschema) {
810 if (!subschema->Validate(it.value(),
811 StrategyForNextLevel(strategy),
812 error_path,
813 error)) {
814 // Invalid property was detected.
815 AddDictKeyPrefixToPath(it.key(), error_path);
816 if (!StrategyAllowInvalidOnTopLevel(strategy))
817 return false;
818 }
819 }
820 }
821 }
822 } else if (value.GetAsList(&list)) {
823 for (base::ListValue::const_iterator it = list->begin(); it != list->end();
824 ++it) {
825 if (!*it ||
826 !GetItems().Validate(**it,
827 StrategyForNextLevel(strategy),
828 error_path,
829 error)) {
830 // Invalid list item was detected.
831 AddListIndexPrefixToPath(it - list->begin(), error_path);
832 if (!StrategyAllowInvalidOnTopLevel(strategy))
833 return false;
834 }
835 }
836 } else if (value.GetAsInteger(&int_value)) {
837 if (node_->extra != kInvalid &&
838 !ValidateIntegerRestriction(node_->extra, int_value)) {
839 SchemaErrorFound(error_path, error, "Invalid value for integer");
840 return false;
841 }
842 } else if (value.GetAsString(&str_value)) {
843 if (node_->extra != kInvalid &&
844 !ValidateStringRestriction(node_->extra, str_value.c_str())) {
845 SchemaErrorFound(error_path, error, "Invalid value for string");
846 return false;
847 }
848 }
849
850 return true;
851 }
852
Normalize(base::Value * value,SchemaOnErrorStrategy strategy,std::string * error_path,std::string * error,bool * changed) const853 bool Schema::Normalize(base::Value* value,
854 SchemaOnErrorStrategy strategy,
855 std::string* error_path,
856 std::string* error,
857 bool* changed) const {
858 if (!valid()) {
859 SchemaErrorFound(error_path, error, "The schema is invalid.");
860 return false;
861 }
862
863 if (!value->IsType(type())) {
864 // Allow the integer to double promotion. Note that range restriction on
865 // double is not supported now.
866 if (value->IsType(base::Value::TYPE_INTEGER) &&
867 type() == base::Value::TYPE_DOUBLE) {
868 return true;
869 }
870
871 SchemaErrorFound(
872 error_path, error, "The value type doesn't match the schema type.");
873 return false;
874 }
875
876 base::DictionaryValue* dict = NULL;
877 base::ListValue* list = NULL;
878 if (value->GetAsDictionary(&dict)) {
879 std::vector<std::string> drop_list; // Contains the keys to drop.
880 for (base::DictionaryValue::Iterator it(*dict); !it.IsAtEnd();
881 it.Advance()) {
882 SchemaList schema_list = GetMatchingProperties(it.key());
883 if (schema_list.empty()) {
884 // Unknown property was detected.
885 SchemaErrorFound(error_path, error, "Unknown property: " + it.key());
886 if (StrategyAllowUnknownOnTopLevel(strategy))
887 drop_list.push_back(it.key());
888 else
889 return false;
890 } else {
891 for (SchemaList::iterator subschema = schema_list.begin();
892 subschema != schema_list.end(); ++subschema) {
893 base::Value* sub_value = NULL;
894 dict->GetWithoutPathExpansion(it.key(), &sub_value);
895 if (!subschema->Normalize(sub_value,
896 StrategyForNextLevel(strategy),
897 error_path,
898 error,
899 changed)) {
900 // Invalid property was detected.
901 AddDictKeyPrefixToPath(it.key(), error_path);
902 if (StrategyAllowInvalidOnTopLevel(strategy)) {
903 drop_list.push_back(it.key());
904 break;
905 } else {
906 return false;
907 }
908 }
909 }
910 }
911 }
912 if (changed && !drop_list.empty())
913 *changed = true;
914 for (std::vector<std::string>::const_iterator it = drop_list.begin();
915 it != drop_list.end();
916 ++it) {
917 dict->RemoveWithoutPathExpansion(*it, NULL);
918 }
919 return true;
920 } else if (value->GetAsList(&list)) {
921 std::vector<size_t> drop_list; // Contains the indexes to drop.
922 for (size_t index = 0; index < list->GetSize(); index++) {
923 base::Value* sub_value = NULL;
924 list->Get(index, &sub_value);
925 if (!sub_value || !GetItems().Normalize(sub_value,
926 StrategyForNextLevel(strategy),
927 error_path,
928 error,
929 changed)) {
930 // Invalid list item was detected.
931 AddListIndexPrefixToPath(index, error_path);
932 if (StrategyAllowInvalidOnTopLevel(strategy))
933 drop_list.push_back(index);
934 else
935 return false;
936 }
937 }
938 if (changed && !drop_list.empty())
939 *changed = true;
940 for (std::vector<size_t>::reverse_iterator it = drop_list.rbegin();
941 it != drop_list.rend(); ++it) {
942 list->Remove(*it, NULL);
943 }
944 return true;
945 }
946
947 return Validate(*value, strategy, error_path, error);
948 }
949
950 // static
Parse(const std::string & content,std::string * error)951 Schema Schema::Parse(const std::string& content, std::string* error) {
952 // Validate as a generic JSON schema, and ignore unknown attributes; they
953 // may become used in a future version of the schema format.
954 scoped_ptr<base::DictionaryValue> dict = JSONSchemaValidator::IsValidSchema(
955 content, JSONSchemaValidator::OPTIONS_IGNORE_UNKNOWN_ATTRIBUTES, error);
956 if (!dict)
957 return Schema();
958
959 // Validate the main type.
960 std::string string_value;
961 if (!dict->GetString(schema::kType, &string_value) ||
962 string_value != schema::kObject) {
963 *error =
964 "The main schema must have a type attribute with \"object\" value.";
965 return Schema();
966 }
967
968 // Checks for invalid attributes at the top-level.
969 if (dict->HasKey(schema::kAdditionalProperties) ||
970 dict->HasKey(schema::kPatternProperties)) {
971 *error = "\"additionalProperties\" and \"patternProperties\" are not "
972 "supported at the main schema.";
973 return Schema();
974 }
975
976 scoped_refptr<const InternalStorage> storage =
977 InternalStorage::ParseSchema(*dict, error);
978 if (!storage.get())
979 return Schema();
980 return Schema(storage, storage->root_node());
981 }
982
type() const983 base::Value::Type Schema::type() const {
984 CHECK(valid());
985 return node_->type;
986 }
987
GetPropertiesIterator() const988 Schema::Iterator Schema::GetPropertiesIterator() const {
989 CHECK(valid());
990 CHECK_EQ(base::Value::TYPE_DICTIONARY, type());
991 return Iterator(storage_, storage_->properties(node_->extra));
992 }
993
994 namespace {
995
CompareKeys(const PropertyNode & node,const std::string & key)996 bool CompareKeys(const PropertyNode& node, const std::string& key) {
997 return node.key < key;
998 }
999
1000 } // namespace
1001
GetKnownProperty(const std::string & key) const1002 Schema Schema::GetKnownProperty(const std::string& key) const {
1003 CHECK(valid());
1004 CHECK_EQ(base::Value::TYPE_DICTIONARY, type());
1005 const PropertiesNode* node = storage_->properties(node_->extra);
1006 const PropertyNode* begin = storage_->property(node->begin);
1007 const PropertyNode* end = storage_->property(node->end);
1008 const PropertyNode* it = std::lower_bound(begin, end, key, CompareKeys);
1009 if (it != end && it->key == key)
1010 return Schema(storage_, storage_->schema(it->schema));
1011 return Schema();
1012 }
1013
GetAdditionalProperties() const1014 Schema Schema::GetAdditionalProperties() const {
1015 CHECK(valid());
1016 CHECK_EQ(base::Value::TYPE_DICTIONARY, type());
1017 const PropertiesNode* node = storage_->properties(node_->extra);
1018 if (node->additional == kInvalid)
1019 return Schema();
1020 return Schema(storage_, storage_->schema(node->additional));
1021 }
1022
GetPatternProperties(const std::string & key) const1023 SchemaList Schema::GetPatternProperties(const std::string& key) const {
1024 CHECK(valid());
1025 CHECK_EQ(base::Value::TYPE_DICTIONARY, type());
1026 const PropertiesNode* node = storage_->properties(node_->extra);
1027 const PropertyNode* begin = storage_->property(node->end);
1028 const PropertyNode* end = storage_->property(node->pattern_end);
1029 SchemaList matching_properties;
1030 for (const PropertyNode* it = begin; it != end; ++it) {
1031 if (re2::RE2::PartialMatch(key, *storage_->CompileRegex(it->key))) {
1032 matching_properties.push_back(
1033 Schema(storage_, storage_->schema(it->schema)));
1034 }
1035 }
1036 return matching_properties;
1037 }
1038
GetProperty(const std::string & key) const1039 Schema Schema::GetProperty(const std::string& key) const {
1040 Schema schema = GetKnownProperty(key);
1041 if (schema.valid())
1042 return schema;
1043 return GetAdditionalProperties();
1044 }
1045
GetMatchingProperties(const std::string & key) const1046 SchemaList Schema::GetMatchingProperties(const std::string& key) const {
1047 SchemaList schema_list;
1048
1049 Schema known_property = GetKnownProperty(key);
1050 if (known_property.valid())
1051 schema_list.push_back(known_property);
1052
1053 SchemaList pattern_properties = GetPatternProperties(key);
1054 schema_list.insert(
1055 schema_list.end(), pattern_properties.begin(), pattern_properties.end());
1056
1057 if (schema_list.empty()) {
1058 Schema additional_property = GetAdditionalProperties();
1059 if (additional_property.valid())
1060 schema_list.push_back(additional_property);
1061 }
1062
1063 return schema_list;
1064 }
1065
GetItems() const1066 Schema Schema::GetItems() const {
1067 CHECK(valid());
1068 CHECK_EQ(base::Value::TYPE_LIST, type());
1069 if (node_->extra == kInvalid)
1070 return Schema();
1071 return Schema(storage_, storage_->schema(node_->extra));
1072 }
1073
ValidateIntegerRestriction(int index,int value) const1074 bool Schema::ValidateIntegerRestriction(int index, int value) const {
1075 const RestrictionNode* rnode = storage_->restriction(index);
1076 if (rnode->ranged_restriction.min_value <=
1077 rnode->ranged_restriction.max_value) {
1078 return rnode->ranged_restriction.min_value <= value &&
1079 rnode->ranged_restriction.max_value >= value;
1080 } else {
1081 for (int i = rnode->enumeration_restriction.offset_begin;
1082 i < rnode->enumeration_restriction.offset_end; ++i) {
1083 if (*storage_->int_enums(i) == value)
1084 return true;
1085 }
1086 return false;
1087 }
1088 }
1089
ValidateStringRestriction(int index,const char * str) const1090 bool Schema::ValidateStringRestriction(int index, const char* str) const {
1091 const RestrictionNode* rnode = storage_->restriction(index);
1092 if (rnode->enumeration_restriction.offset_begin <
1093 rnode->enumeration_restriction.offset_end) {
1094 for (int i = rnode->enumeration_restriction.offset_begin;
1095 i < rnode->enumeration_restriction.offset_end; ++i) {
1096 if (strcmp(*storage_->string_enums(i), str) == 0)
1097 return true;
1098 }
1099 return false;
1100 } else {
1101 int index = rnode->string_pattern_restriction.pattern_index;
1102 DCHECK(index == rnode->string_pattern_restriction.pattern_index_backup);
1103 re2::RE2* regex = storage_->CompileRegex(*storage_->string_enums(index));
1104 return re2::RE2::PartialMatch(str, *regex);
1105 }
1106 }
1107
1108 } // namespace policy
1109