| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657 |
#pragma once

#include <algorithm>
#include <concepts>
#include <cstddef>
#include <cstdint>
#include <map>
#include <optional>
#include <set>
#include <sstream>
#include <string>
#include <tuple>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <variant>

#include <jvalidate/constraint/array_constraint.h>
#include <jvalidate/constraint/general_constraint.h>
#include <jvalidate/constraint/number_constraint.h>
#include <jvalidate/constraint/object_constraint.h>
#include <jvalidate/constraint/string_constraint.h>
#include <jvalidate/constraint/visitor.h>
#include <jvalidate/detail/enumerate.h>
#include <jvalidate/detail/expect.h>
#include <jvalidate/detail/iostream.h>
#include <jvalidate/detail/number.h>
#include <jvalidate/detail/pointer.h>
#include <jvalidate/detail/scoped_state.h>
#include <jvalidate/forward.h>
#include <jvalidate/schema.h>
#include <jvalidate/status.h>
#include <jvalidate/validation_config.h>
#include <jvalidate/validation_result.h>
// Yields the std::unordered_set<type> stored in the tuple that `visited_`
// points at (size_t for array indices, std::string for object keys).
// `visited_` is dereferenced unconditionally, so callers must check it first.
#define VISITED(type) (std::get<std::unordered_set<type>>(*visited_))
// Guard placed at the top of type-specific visit() overloads: hands the check
// "document_ has adapter type `etype`" to RETURN_UNLESS together with
// Status::Noop (presumably the value returned when the check fails - see
// jvalidate/detail/expect.h).
#define NOOP_UNLESS_TYPE(etype)                                                \
  RETURN_UNLESS(document_.type() == adapter::Type::etype, Status::Noop)
// Leaves the *enclosing loop* as soon as further work cannot change anything
// observable: the running status `rval` is already Reject, no ValidationResult
// is being collected (`result_` is null) and no visited-annotation is being
// tracked (`visited_` is null).
//
// Must be used as a statement directly inside a loop body, followed by `;`.
// It reads `rval`, `result_` and `visited_` from the expansion site.
//
// The previous definition wrapped the `break` in `do { ... } while (false)`,
// so the `break` only left that wrapper and never the caller's loop. The
// if/else form below is still safe as a single statement (no dangling-else
// hazard, since the `if` carries its own `else`) and really breaks the loop.
#define BREAK_EARLY_IF_NO_RESULT_TREE()                                        \
  if (not(rval == Status::Reject and not result_ and not visited_)) {          \
  } else                                                                       \
    break
- namespace jvalidate {
- template <Adapter A, RegexEngine RE>
- class ValidationVisitor : public constraint::ConstraintVisitor {
- private:
- using VisitedAnnotation = std::tuple<std::unordered_set<size_t>, std::unordered_set<std::string>>;
- JVALIDATE_TRIBOOL_TYPE(StoreResults, ForValid, ForInvalid, ForAnything);
- private:
- A document_;
- detail::Pointer where_;
- detail::Pointer schema_path_;
- schema::Node const * schema_;
- ValidationResult * result_;
- ValidationConfig const & cfg_;
- std::unordered_map<std::string, RE> & regex_cache_;
- mutable VisitedAnnotation * visited_ = nullptr;
- mutable StoreResults tracking_ = StoreResults::ForInvalid;
- public:
- ValidationVisitor(A const & json, schema::Node const & schema, ValidationConfig const & cfg,
- std::unordered_map<std::string, RE> & regex_cache, ValidationResult * result)
- : document_(json), schema_(&schema), result_(result), cfg_(cfg), regex_cache_(regex_cache) {}
- Status visit(constraint::TypeConstraint const & cons) const {
- adapter::Type const type = document_.type();
- for (adapter::Type const accept : cons.types) {
- if (type == accept) {
- return note(Status::Accept, "type ", type, " is one of [", cons.types, "]");
- }
- if (accept == adapter::Type::Number && type == adapter::Type::Integer) {
- return note(Status::Accept, "type ", type, " is one of [", cons.types, "]");
- }
- if (accept == adapter::Type::Integer && type == adapter::Type::Number &&
- detail::is_json_integer(document_.as_number())) {
- return note(Status::Accept, "type ", type, " is one of [", cons.types, "]");
- }
- }
- return note(Status::Reject, "type ", type, " is not one of [", cons.types, "]");
- }
- Status visit(constraint::ExtensionConstraint const & cons) const {
- return cons.validate(document_, where_, result_);
- }
- Status visit(constraint::EnumConstraint const & cons) const {
- auto is_equal = [this](auto const & frozen) {
- return document_.equals(frozen, cfg_.strict_equality);
- };
- size_t index = 0;
- for (auto const & option : cons.enumeration) {
- if (option->apply(is_equal)) {
- return note(Status::Accept, "value is enum ", index);
- }
- ++index;
- }
- return note(Status::Reject, "value is none of the enums");
- }
- Status visit(constraint::AllOfConstraint const & cons) const {
- Status rval = Status::Accept;
- std::set<size_t> unmatched;
- for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
- if (auto stat = validate_subschema(subschema, index); stat == Status::Reject) {
- rval = Status::Reject;
- unmatched.insert(index);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- if (rval == Status::Reject) {
- return note(rval, "does not validate subschemas ", unmatched);
- }
- return note(rval, "validates all subschemas");
- }
- Status visit(constraint::AnyOfConstraint const & cons) const {
- std::optional<size_t> first_validated;
- for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
- if (validate_subschema(subschema, index)) {
- first_validated = index;
- }
- if (not visited_ && first_validated.has_value()) {
- break;
- }
- }
- if (first_validated.has_value()) {
- return note(Status::Accept, "validates subschema ", *first_validated);
- }
- return note(Status::Reject, "validates none of the subschemas");
- }
- Status visit(constraint::OneOfConstraint const & cons) const {
- scoped_state(tracking_, StoreResults::ForAnything);
- std::set<size_t> matches;
- for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
- if (validate_subschema(subschema, index)) {
- matches.insert(index);
- }
- }
- if (matches.size() == 1) {
- return note(Status::Accept, "validates subschema ", *matches.begin());
- }
- return note(Status::Reject, "validates multiple subschemas ", matches);
- }
- Status visit(constraint::NotConstraint const & cons) const {
- scoped_state(visited_, nullptr);
- scoped_state(tracking_, !tracking_);
- bool const rejected = validate_subschema(cons.child) == Status::Reject;
- if (not rejected) {
- annotate("actually validates subschema");
- }
- return rejected;
- }
- Status visit(constraint::ConditionalConstraint const & cons) const {
- bool const if_true = [this, &cons]() {
- scoped_state(tracking_, StoreResults::ForAnything);
- return validate_subschema(cons.if_constraint);
- }();
- if (if_true) {
- return validate_subschema(cons.then_constraint, detail::parent, "then");
- }
- return validate_subschema(cons.else_constraint, detail::parent, "else");
- }
- Status visit(constraint::MaximumConstraint const & cons) const {
- switch (document_.type()) {
- case adapter::Type::Integer:
- if (int64_t value = document_.as_integer(); not cons(value)) {
- return note(Status::Reject, value, cons.exclusive ? " >= " : " > ", cons.value);
- } else {
- return note(Status::Accept, value, cons.exclusive ? " < " : " <= ", cons.value);
- }
- case adapter::Type::Number:
- if (double value = document_.as_number(); not cons(value)) {
- return note(Status::Reject, value, cons.exclusive ? " >= " : " > ", cons.value);
- } else {
- return note(Status::Accept, value, cons.exclusive ? " < " : " <= ", cons.value);
- }
- default:
- return Status::Noop;
- }
- }
- Status visit(constraint::MinimumConstraint const & cons) const {
- switch (document_.type()) {
- case adapter::Type::Integer:
- if (int64_t value = document_.as_integer(); not cons(value)) {
- return note(Status::Reject, value, cons.exclusive ? " <= " : " < ", cons.value);
- } else {
- return note(Status::Accept, value, cons.exclusive ? " > " : " >= ", cons.value);
- }
- case adapter::Type::Number:
- if (double value = document_.as_number(); not cons(value)) {
- return note(Status::Reject, value, cons.exclusive ? " <= " : " < ", cons.value);
- } else {
- return note(Status::Accept, value, cons.exclusive ? " > " : " >= ", cons.value);
- }
- default:
- return Status::Noop;
- }
- }
- Status visit(constraint::MultipleOfConstraint const & cons) const {
- adapter::Type const type = document_.type();
- RETURN_UNLESS(type == adapter::Type::Number || type == adapter::Type::Integer, Status::Noop);
- if (double value = document_.as_number(); not cons(value)) {
- return note(Status::Reject, value, " is not a multiple of ", cons.value);
- } else {
- return note(Status::Accept, value, " is a multiple of ", cons.value);
- }
- }
- Status visit(constraint::MaxLengthConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- std::string const str = document_.as_string();
- if (int64_t len = detail::length(str); len > cons.value) {
- return note(Status::Reject, "'", str, "' of length ", len, " is >", cons.value);
- } else {
- return note(Status::Accept, "'", str, "' of length ", len, " is <=", cons.value);
- }
- }
- Status visit(constraint::MinLengthConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- std::string const str = document_.as_string();
- if (int64_t len = detail::length(str); len > cons.value) {
- return note(Status::Reject, "'", str, "' of length ", len, " is <", cons.value);
- } else {
- return note(Status::Accept, "'", str, "' of length ", len, " is >=", cons.value);
- }
- }
- Status visit(constraint::PatternConstraint const & cons) const {
- NOOP_UNLESS_TYPE(String);
- RE const & regex = regex_cache_.try_emplace(cons.regex, cons.regex).first->second;
- std::string const str = document_.as_string();
- if (regex.search(str)) {
- return note(Status::Accept, "'", str, "' matches pattern /", cons.regex, "/");
- }
- return note(Status::Reject, "'", str, "' does not match pattern /", cons.regex, "/");
- }
- Status visit(constraint::FormatConstraint const & cons) const {
- // https://json-schema.org/draft/2020-12/draft-bhutton-json-schema-validation-01#name-defined-formats
- NOOP_UNLESS_TYPE(String);
- // TODO(samjaffe): annotate(cons.format)
- annotate("format '", cons.format, "'");
- if (not cfg_.validate_format && not cons.is_assertion) {
- return true;
- }
- return note(Status::Reject, " is unimplemented");
- }
- Status visit(constraint::AdditionalItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- auto array = document_.as_array();
- Status rval = Status::Accept;
- for (size_t i = cons.applies_after_nth; i < array.size(); ++i) {
- rval &= validate_subschema_on(cons.subschema, array[i], i);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::ContainsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- auto array = document_.as_array();
- size_t const minimum = cons.minimum.value_or(1);
- size_t const maximum = cons.maximum.value_or(array.size());
- size_t matches = 0;
- for (size_t i = 0; i < array.size(); ++i) {
- if (validate_subschema_on(cons.subschema, array[i], i)) {
- ++matches;
- }
- }
- if (matches < minimum) {
- return note(Status::Reject, "array contains <", minimum, " matching elements");
- }
- if (matches > maximum) {
- return note(Status::Reject, "array contains >", maximum, " matching elements");
- }
- return Status::Accept;
- }
- Status visit(constraint::MaxItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (size_t size = document_.array_size(); size > cons.value) {
- return note(Status::Reject, "array of size ", size, " is >", cons.value);
- } else {
- return note(Status::Accept, "array of size ", size, " is <=", cons.value);
- }
- }
- Status visit(constraint::MinItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (size_t size = document_.array_size(); size > cons.value) {
- return note(Status::Reject, "array of size ", size, " is <", cons.value);
- } else {
- return note(Status::Accept, "array of size ", size, " is >=", cons.value);
- }
- }
- Status visit(constraint::TupleConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- Status rval = Status::Accept;
- auto array = document_.as_array();
- size_t const n = std::min(cons.items.size(), array.size());
- for (size_t i = 0; i < n; ++i) {
- rval &= validate_subschema_on(cons.items[i], array[i], i);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::UniqueItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if constexpr (std::totally_ordered<A>) {
- std::map<A, size_t> cache;
- size_t index = 0;
- for (A const & elem : document_.as_array()) {
- if (auto [it, created] = cache.emplace(elem, index); not created) {
- return note(Status::Reject, "items ", it->second, " and ", index, " are equal");
- }
- ++index;
- }
- } else {
- auto array = document_.as_array();
- for (size_t i = 0; i < array.size(); ++i) {
- for (size_t j = i + 1; j < array.size(); ++j) {
- if (array[i].equals(array[j], true)) {
- return note(Status::Reject, "items ", i, " and ", j, " are equal");
- }
- }
- }
- }
- return note(Status::Accept, "all array items are unique");
- }
- Status visit(constraint::AdditionalPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto matches_any_pattern = [this, &cons](std::string const & key) {
- for (auto & pattern : cons.patterns) {
- RE const & regex = regex_cache_.try_emplace(pattern, pattern).first->second;
- if (regex.search(key)) {
- return true;
- }
- }
- return false;
- };
- Status rval = Status::Accept;
- for (auto const & [key, elem] : document_.as_object()) {
- if (not cons.properties.contains(key) && not matches_any_pattern(key)) {
- rval &= validate_subschema_on(cons.subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::DependenciesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto object = document_.as_object();
- Status rval = Status::Accept;
- for (auto const & [key, subschema] : cons.subschemas) {
- if (not object.contains(key)) {
- continue;
- }
- rval &= validate_subschema(subschema, key);
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- for (auto [key, required] : cons.required) {
- if (not object.contains(key)) {
- continue;
- }
- for (auto const & [key, _] : object) {
- required.erase(key);
- }
- rval &= required.empty();
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::MaxPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (size_t size = document_.object_size(); size > cons.value) {
- return note(Status::Reject, "object of size ", size, " is >", cons.value);
- } else {
- return note(Status::Accept, "object of size ", size, " is <=", cons.value);
- }
- }
- Status visit(constraint::MinPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (size_t size = document_.object_size(); size > cons.value) {
- return note(Status::Reject, "object of size ", size, " is <", cons.value);
- } else {
- return note(Status::Accept, "object of size ", size, " is >=", cons.value);
- }
- }
- Status visit(constraint::PatternPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- for (auto const & [pattern, subschema] : cons.properties) {
- RE const & regex = regex_cache_.try_emplace(pattern, pattern).first->second;
- for (auto const & [key, elem] : document_.as_object()) {
- if (regex.search(key)) {
- rval &= validate_subschema_on(subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- }
- return rval;
- }
- Status visit(constraint::PropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- auto object = document_.as_object();
- if constexpr (MutableAdapter<A>) {
- for (auto const & [key, subschema] : cons.properties) {
- auto const * default_value = subschema->default_value();
- if (default_value && not object.contains(key)) {
- object.assign(key, *default_value);
- }
- }
- }
- for (auto const & [key, elem] : object) {
- if (auto it = cons.properties.find(key); it != cons.properties.end()) {
- rval &= validate_subschema_on(it->second, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::PropertyNamesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- Status rval = Status::Accept;
- for (auto const & [key, _] : document_.as_object()) {
- // TODO(samjaffe): Should we prefer a std::string adapter like valijson?
- typename A::value_type key_json{key};
- rval &= validate_subschema_on(cons.key_schema, A(key_json), std::string("$$key"));
- }
- return rval;
- }
- Status visit(constraint::RequiredConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- auto required = cons.properties;
- for (auto const & [key, _] : document_.as_object()) {
- required.erase(key);
- }
- if (required.empty()) {
- return note(Status::Accept, "contains all required properties ", cons.properties);
- }
- return note(Status::Reject, "missing required properties ", required);
- }
- Status visit(constraint::UnevaluatedItemsConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Array);
- if (not visited_) {
- return Status::Reject;
- }
- Status rval = Status::Accept;
- auto array = document_.as_array();
- for (size_t i = 0; i < array.size(); ++i) {
- if (not VISITED(size_t).contains(i)) {
- rval &= validate_subschema_on(cons.subschema, array[i], i);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status visit(constraint::UnevaluatedPropertiesConstraint const & cons) const {
- NOOP_UNLESS_TYPE(Object);
- if (not visited_) {
- return Status::Reject;
- }
- Status rval = Status::Accept;
- for (auto const & [key, elem] : document_.as_object()) {
- if (not VISITED(std::string).contains(key)) {
- rval &= validate_subschema_on(cons.subschema, elem, key);
- }
- BREAK_EARLY_IF_NO_RESULT_TREE();
- }
- return rval;
- }
- Status validate() {
- if (std::optional<std::string> const & reject = schema_->rejects_all()) {
- annotate(*reject);
- return Status::Reject;
- }
- if (schema_->accepts_all()) {
- // An accept-all schema is not No-Op for the purpose of unevaluated*
- return Status::Accept;
- }
- VisitedAnnotation annotate;
- if (schema_->requires_result_context() and not visited_) {
- visited_ = &annotate;
- }
- Status rval = Status::Noop;
- if (std::optional<schema::Node const *> ref = schema_->reference_schema()) {
- rval = validate_subschema(*ref, "$ref");
- }
- detail::Pointer const current_schema = schema_path_;
- for (auto const & [key, p_constraint] : schema_->constraints()) {
- BREAK_EARLY_IF_NO_RESULT_TREE();
- schema_path_ = current_schema / key;
- rval &= p_constraint->accept(*this);
- }
- for (auto const & [key, p_constraint] : schema_->post_constraints()) {
- BREAK_EARLY_IF_NO_RESULT_TREE();
- schema_path_ = current_schema / key;
- rval &= p_constraint->accept(*this);
- }
- return rval;
- }
- private:
- template <typename... Args> void annotate(Args &&... args) const {
- if (not result_) {
- return;
- }
- std::stringstream ss;
- using ::jvalidate::operator<<;
- [[maybe_unused]] int _[] = {(ss << std::forward<Args>(args), 0)...};
- result_->annotate(where_, schema_path_, ss.str());
- }
- template <typename... Args> Status note(Status stat, Args &&... args) const {
- switch (tracking_) {
- case StoreResults::ForAnything:
- if (stat != Status::Noop) {
- annotate(std::forward<Args>(args)...);
- }
- break;
- case StoreResults::ForValid:
- if (stat == Status::Accept) {
- annotate(std::forward<Args>(args)...);
- }
- break;
- case StoreResults::ForInvalid:
- if (stat == Status::Reject) {
- annotate(std::forward<Args>(args)...);
- }
- break;
- }
- return stat;
- }
// Adds every element of `from` to `to`; elements already present are kept.
template <typename C> static void merge_visited(C & to, C const & from) {
  for (auto const & element : from) {
    to.insert(element);
  }
}
- template <typename... K>
- Status validate_subschema(constraint::Constraint::SubConstraint const & subschema,
- K const &... keys) const {
- if (schema::Node const * const * ppschema = std::get_if<0>(&subschema)) {
- return validate_subschema(*ppschema, keys...);
- } else {
- return std::get<1>(subschema)->accept(*this);
- }
- }
- template <typename... K>
- Status validate_subschema(schema::Node const * subschema, K const &... keys) const {
- VisitedAnnotation annotate;
- ValidationVisitor next = *this;
- ((next.schema_path_ /= keys), ...);
- std::tie(next.schema_, next.visited_) =
- std::forward_as_tuple(subschema, visited_ ? &annotate : nullptr);
- Status rval = next.validate();
- if (rval == Status::Accept and visited_) {
- merge_visited(std::get<0>(*visited_), std::get<0>(annotate));
- merge_visited(std::get<1>(*visited_), std::get<1>(annotate));
- }
- return rval;
- }
- template <typename K>
- Status validate_subschema_on(schema::Node const * subschema, A const & document,
- K const & key) const {
- ValidationResult result;
- ValidationVisitor next = *this;
- next.where_ /= key;
- std::tie(next.document_, next.schema_, next.result_, next.visited_) =
- std::forward_as_tuple(document, subschema, result_ ? &result : nullptr, nullptr);
- auto status = next.validate();
- if (status == Status::Accept and visited_) {
- VISITED(K).insert(key);
- }
- if (status == Status::Reject and result_) {
- result_->annotate(std::move(result));
- }
- return status;
- }
- };
- }
|