| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643 |
- #pragma once
- #include <tuple>
- #include <unordered_map>
- #include <jvalidate/constraint/array_constraint.h>
- #include <jvalidate/constraint/general_constraint.h>
- #include <jvalidate/constraint/number_constraint.h>
- #include <jvalidate/constraint/object_constraint.h>
- #include <jvalidate/constraint/string_constraint.h>
- #include <jvalidate/constraint/visitor.h>
- #include <jvalidate/detail/expect.h>
- #include <jvalidate/detail/iostream.h>
- #include <jvalidate/detail/number.h>
- #include <jvalidate/detail/pointer.h>
- #include <jvalidate/forward.h>
- #include <jvalidate/schema.h>
- #include <jvalidate/status.h>
- #include <jvalidate/validation_config.h>
- #include <jvalidate/validation_result.h>
/// Accesses the set of evaluated keys of the given type inside the active
/// annotation tuple (size_t for array indices, std::string for property names).
/// Dereferences visited_, so it may only be used when visited_ is non-null.
#define VISITED(type) std::get<std::unordered_set<type>>(*visited_)

/// Leaves the enclosing function with Status::Noop (through RETURN_UNLESS, which
/// is defined outside this file) unless the document has the given adapter::Type.
#define NOOP_UNLESS_TYPE(etype)                                                                    \
  RETURN_UNLESS(adapter::Type::etype == document_.type(), Status::Noop)

/// Breaks out of the ENCLOSING loop once the local `rval` is Status::Reject and
/// neither an error tree (result_) nor annotations (visited_) are being
/// collected - at that point further work cannot change the outcome.
///
/// This must NOT be wrapped in `do { ... } while (false)`: a `break` inside such
/// a wrapper only terminates the wrapper, leaving the caller's loop running.
/// The `if (...) {} else break` form still requires a trailing semicolon at the
/// call site and is safe next to a caller's own if/else.
#define BREAK_EARLY_IF_NO_RESULT_TREE()                                                            \
  if (not(rval == Status::Reject and not result_ and not visited_)) {                              \
  } else                                                                                           \
    break
- namespace jvalidate {
- template <Adapter A, RegexEngine RE>
- class ValidationVisitor : public constraint::ConstraintVisitor {
- private:
- using VisitedAnnotation = std::tuple<std::unordered_set<size_t>, std::unordered_set<std::string>>;
- private:
- A document_;
- detail::Pointer where_;
- detail::Pointer schema_path_;
- schema::Node const * schema_;
- ValidationResult * result_;
- ValidationConfig const & cfg_;
- std::unordered_map<std::string, RE> & regex_cache_;
- mutable VisitedAnnotation * visited_ = nullptr;
- public:
- ValidationVisitor(A const & json, schema::Node const & schema, ValidationConfig const & cfg,
- std::unordered_map<std::string, RE> & regex_cache, ValidationResult * result)
- : document_(json), schema_(&schema), result_(result), cfg_(cfg), regex_cache_(regex_cache) {}
- Status visit(constraint::TypeConstraint const & cons) const {
- adapter::Type const type = document_.type();
- for (adapter::Type const accept : cons.types) {
- if (type == accept) {
- return Status::Accept;
- }
- if (accept == adapter::Type::Number && type == adapter::Type::Integer) {
- return Status::Accept;
- }
- if (accept == adapter::Type::Integer && type == adapter::Type::Number &&
- detail::is_json_integer(document_.as_number())) {
- return Status::Accept;
- }
- }
- add_error("type ", type, " is not one of {", cons.types, "}");
- return Status::Reject;
- }
- Status visit(constraint::ExtensionConstraint const & cons) const {
- return cons.validate(document_, where_, result_);
- }
- Status visit(constraint::EnumConstraint const & cons) const {
- auto is_equal = [this](auto const & frozen) {
- return document_.equals(frozen, cfg_.strict_equality);
- };
- for (auto const & option : cons.enumeration) {
- if (option->apply(is_equal)) {
- return Status::Accept;
- }
- }
- add_error("equals none of the values");
- return Status::Reject;
- }
- Status visit(constraint::AllOfConstraint const & cons) const {
- Status rval = Status::Accept;
- std::set<size_t> unmatched;
- size_t i = 0;
- for (auto const & subschema : cons.children) {
- if (auto stat = validate_subschema(subschema, i); stat == Status::Reject) {
- rval = Status::Reject;
- unmatched.insert(i);
- }
- ++i;
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- if (rval == Status::Reject) {
- add_error("does not validate subschemas ", unmatched);
- }
- return rval;
- }
- Status visit(constraint::AnyOfConstraint const & cons) const {
- size_t i = 0;
- Status rval = Status::Reject;
- for (auto const & subschema : cons.children) {
- if (validate_subschema(subschema, i)) {
- rval = Status::Accept;
- }
- if (not visited_ && rval == Status::Accept) {
- break;
- }
- ++i;
- }
- if (rval == Status::Reject) {
- add_error("validates none of the subschemas");
- }
- return rval;
- }
- Status visit(constraint::OneOfConstraint const & cons) const {
- std::set<size_t> matches;
- size_t i = 0;
- for (schema::Node const * subschema : cons.children) {
- if (validate_subschema(subschema, i)) {
- matches.insert(i);
- }
- ++i;
- }
- if (matches.size() == 1) {
- return Status::Accept;
- }
- add_error("validates subschemas ", matches);
- return Status::Reject;
- }
- Status visit(constraint::NotConstraint const & cons) const {
- VisitedAnnotation * suppress = nullptr;
- std::swap(suppress, visited_);
- bool const rval = validate_subschema(cons.child) == Status::Reject;
- std::swap(suppress, visited_);
- if (not rval) {
- add_error("actually validates subschema");
- }
- return rval;
- }
- Status visit(constraint::ConditionalConstraint const & cons) const {
- VisitedAnnotation * suppress = nullptr;
- std::swap(suppress, visited_);
- bool const if_result(validate_subschema(cons.if_constraint));
- std::swap(suppress, visited_);
- if (if_result) {
- return validate_subschema(cons.then_constraint, detail::parent, "then");
- }
- return validate_subschema(cons.else_constraint, detail::parent, "else");
- }
- Status visit(constraint::MaximumConstraint const & cons) const {
- switch (document_.type()) {
- case adapter::Type::Integer:
- if (int64_t value = document_.as_integer(); not cons(value)) {
- add_error("integer ", value, " exceeds ", cons.exclusive ? "exclusive " : "", "maximum of ",
- cons.value);
- return false;
- }
- return true;
- case adapter::Type::Number:
- if (double value = document_.as_number(); not cons(value)) {
- add_error("number ", value, " exceeds ", cons.exclusive ? "exclusive " : "", "maximum of ",
- cons.value);
- return false;
- }
- return true;
- default:
- return Status::Noop;
- }
- }
- Status visit(constraint::MinimumConstraint const & cons) const {
- switch (document_.type()) {
- case adapter::Type::Integer:
- if (int64_t value = document_.as_integer(); not cons(value)) {
- add_error("integer ", value, " fails ", cons.exclusive ? "exclusive " : "", "minimum of ",
- cons.value);
- return false;
- }
- return true;
- case adapter::Type::Number:
- if (double value = document_.as_number(); not cons(value)) {
- add_error("number ", value, " fails ", cons.exclusive ? "exclusive " : "", "minimum of ",
- cons.value);
- return false;
- }
- return true;
- default:
- return Status::Noop;
- }
- }
- Status visit(constraint::MultipleOfConstraint const & cons) const {
- adapter::Type const type = document_.type();
- RETURN_UNLESS(type == adapter::Type::Number || type == adapter::Type::Integer, Status::Noop);
- if (double value = document_.as_number(); not cons(value)) {
- add_error("number ", value, " is not a multiple of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::MaxLengthConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- if (auto str = document_.as_string(); detail::length(str) > cons.value) {
- add_error("string '", str, "' is greater than the maximum length of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::MinLengthConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- if (auto str = document_.as_string(); detail::length(str) < cons.value) {
- add_error("string '", str, "' is less than the minimum length of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::PatternConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- RE const & regex = regex_cache_.try_emplace(cons.regex, cons.regex).first->second;
- if (auto str = document_.as_string(); not regex.search(str)) {
- add_error("string '", str, "' does not match pattern /", cons.regex, "/");
- return false;
- }
- return true;
- }
- Status visit(constraint::FormatConstraint const & cons) const {
- // https://json-schema.org/draft/2020-12/draft-bhutton-json-schema-validation-01#name-defined-formats
- NOOP_UNLESS_TYPE(String);
- if (not cfg_.validate_format && not cons.is_assertion) {
- return true;
- }
- add_error("unimplemented format assertion: '", cons.format, "'");
- return false;
- }
- Status visit(constraint::AdditionalItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- auto array = document_.as_array();
- Status rval = Status::Accept;
- for (size_t i = cons.applies_after_nth; i < array.size(); ++i) {
- rval &= validate_subschema_on(cons.subschema, array[i], i);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::ContainsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- auto array = document_.as_array();
- size_t const minimum = cons.minimum.value_or(1);
- size_t const maximum = cons.maximum.value_or(array.size());
- size_t matches = 0;
- for (size_t i = 0; i < array.size(); ++i) {
- if (validate_subschema_on(cons.subschema, array[i], i)) {
- ++matches;
- }
- }
- if (matches < minimum) {
- add_error("array does not contain at least ", minimum, " matching elements");
- return Status::Reject;
- }
- if (matches > maximum) {
- add_error("array contains more than ", maximum, " matching elements");
- return Status::Reject;
- }
- return Status::Accept;
- }
- Status visit(constraint::MaxItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (auto size = document_.array_size(); size > cons.value) {
- add_error("array with ", size, " items is greater than the maximum of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::MinItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (auto size = document_.array_size(); size < cons.value) {
- add_error("array with ", size, " items is less than the minimum of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::TupleConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- Status rval = Status::Accept;
- auto array = document_.as_array();
- size_t const n = std::min(cons.items.size(), array.size());
- for (size_t i = 0; i < n; ++i) {
- rval &= validate_subschema_on(cons.items[i], array[i], i);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::UniqueItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if constexpr (std::totally_ordered<A>) {
- std::set<A> cache;
- for (A const & elem : document_.as_array()) {
- if (not cache.insert(elem).second) {
- add_error("array contains duplicate elements");
- return Status::Reject;
- }
- }
- } else {
- auto array = document_.as_array();
- for (size_t i = 0; i < array.size(); ++i) {
- for (size_t j = i + 1; j < array.size(); ++j) {
- if (array[i].equals(array[j], true)) {
- add_error("array elements ", i, " and ", j, " are equal");
- return Status::Reject;
- }
- }
- }
- }
- return Status::Accept;
- }
- Status visit(constraint::AdditionalPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto matches_any_pattern = [this, &cons](std::string const & key) {
- for (auto & pattern : cons.patterns) {
- RE const & regex = regex_cache_.try_emplace(pattern, pattern).first->second;
- if (regex.search(key)) {
- return true;
- }
- }
- return false;
- };
- Status rval = Status::Accept;
- for (auto const & [key, elem] : document_.as_object()) {
- if (not cons.properties.contains(key) && not matches_any_pattern(key)) {
- rval &= validate_subschema_on(cons.subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::DependenciesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto object = document_.as_object();
- Status rval = Status::Accept;
- for (auto const & [key, subschema] : cons.subschemas) {
- if (not object.contains(key)) {
- continue;
- }
- rval &= validate_subschema(subschema, key);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- for (auto [key, required] : cons.required) {
- if (not object.contains(key)) {
- continue;
- }
- for (auto const & [key, _] : object) {
- required.erase(key);
- }
- rval &= required.empty();
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::MaxPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (auto size = document_.object_size(); size > cons.value) {
- add_error("object with ", size, " properties is greater than the maximum of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::MinPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (auto size = document_.object_size(); size < cons.value) {
- add_error("object with ", size, " properties is less than the minimum of ", cons.value);
- return false;
- }
- return true;
- }
- Status visit(constraint::PatternPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- for (auto const & [pattern, subschema] : cons.properties) {
- RE const & regex = regex_cache_.try_emplace(pattern, pattern).first->second;
- for (auto const & [key, elem] : document_.as_object()) {
- if (regex.search(key)) {
- rval &= validate_subschema_on(subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- }
- return rval;
- }
- Status visit(constraint::PropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- auto object = document_.as_object();
- if constexpr (MutableAdapter<A>) {
- for (auto const & [key, subschema] : cons.properties) {
- auto const * default_value = subschema->default_value();
- if (default_value && not object.contains(key)) {
- object.assign(key, *default_value);
- }
- }
- }
- for (auto const & [key, elem] : object) {
- if (auto it = cons.properties.find(key); it != cons.properties.end()) {
- rval &= validate_subschema_on(it->second, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::PropertyNamesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- for (auto const & [key, _] : document_.as_object()) {
- // TODO(samjaffe): Should we prefer a std::string adapter like valijson?
- typename A::value_type key_json{key};
- rval &= validate_subschema_on(cons.key_schema, A(key_json), std::string("$$key"));
- }
- return rval;
- }
- Status visit(constraint::RequiredConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto required = cons.properties;
- for (auto const & [key, _] : document_.as_object()) {
- required.erase(key);
- }
- if (required.empty()) {
- return Status::Accept;
- }
- add_error("missing required properties ", required);
- return Status::Reject;
- }
- Status visit(constraint::UnevaluatedItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (not visited_) {
- return Status::Reject;
- }
- Status rval = Status::Accept;
- auto array = document_.as_array();
- for (size_t i = 0; i < array.size(); ++i) {
- if (not VISITED(size_t).contains(i)) {
- rval &= validate_subschema_on(cons.subschema, array[i], i);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::UnevaluatedPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (not visited_) {
- return Status::Reject;
- }
- Status rval = Status::Accept;
- for (auto const & [key, elem] : document_.as_object()) {
- if (not VISITED(std::string).contains(key)) {
- rval &= validate_subschema_on(cons.subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status validate() {
- if (auto const & reject = schema_->rejects_all()) {
- add_error(*reject);
- return Status::Reject;
- }
- if (schema_->accepts_all()) {
- // An accept-all schema is not No-Op for the purpose of unevaluated*
- return Status::Accept;
- }
- VisitedAnnotation annotate;
- if (schema_->requires_result_context() and not visited_) {
- visited_ = &annotate;
- }
- Status rval = Status::Noop;
- if (auto ref = schema_->reference_schema()) {
- rval = validate_subschema(*ref, "$ref");
- }
- detail::Pointer const current_schema = schema_path_;
- for (auto const & [key, p_constraint] : schema_->constraints()) {
- BREAK_EARLY_IF_NO_RESULT_TREE();
- schema_path_ = current_schema / key;
- rval &= p_constraint->accept(*this);
- }
- for (auto const & [key, p_constraint] : schema_->post_constraints()) {
- BREAK_EARLY_IF_NO_RESULT_TREE();
- schema_path_ = current_schema / key;
- rval &= p_constraint->accept(*this);
- }
- return rval;
- }
- private:
- template <typename... Args> void add_error(Args &&... args) const {
- if (not result_) {
- return;
- }
- std::stringstream ss;
- using ::jvalidate::operator<<;
- [[maybe_unused]] int _[] = {(ss << std::forward<Args>(args), 0)...};
- result_->add_error(where_, schema_path_, ss.str());
- }
/// Adds every element of `from` to `to`.
template <typename C> static void merge_visited(C & to, C const & from) {
  for (auto const & item : from) {
    to.insert(item);
  }
}
- template <typename... K>
- Status validate_subschema(constraint::Constraint::SubConstraint const & subschema,
- K const &... keys) const {
- if (schema::Node const * const * ppschema = std::get_if<0>(&subschema)) {
- return validate_subschema(*ppschema, keys...);
- } else {
- return std::get<1>(subschema)->accept(*this);
- }
- }
- template <typename... K>
- Status validate_subschema(schema::Node const * subschema, K const &... keys) const {
- VisitedAnnotation annotate;
- ValidationVisitor next = *this;
- ((next.schema_path_ /= keys), ...);
- std::tie(next.schema_, next.visited_) =
- std::forward_as_tuple(subschema, visited_ ? &annotate : nullptr);
- Status rval = next.validate();
- if (rval == Status::Accept and visited_) {
- merge_visited(std::get<0>(*visited_), std::get<0>(annotate));
- merge_visited(std::get<1>(*visited_), std::get<1>(annotate));
- }
- return rval;
- }
- template <typename K>
- Status validate_subschema_on(schema::Node const * subschema, A const & document,
- K const & key) const {
- ValidationResult result;
- ValidationVisitor next = *this;
- next.where_ /= key;
- std::tie(next.document_, next.schema_, next.result_, next.visited_) =
- std::forward_as_tuple(document, subschema, result_ ? &result : nullptr, nullptr);
- auto status = next.validate();
- if (status == Status::Accept and visited_) {
- VISITED(K).insert(key);
- }
- if (status == Status::Reject and result_) {
- result_->add_error(std::move(result));
- }
- return status;
- }
- };
- }
|