// validation_visitor.h
  1. #pragma once
  2. #include <algorithm>
  3. #include <tuple>
  4. #include <type_traits>
  5. #include <vector>
  6. #include <jvalidate/compat/enumerate.h>
  7. #include <jvalidate/constraint/array_constraint.h>
  8. #include <jvalidate/constraint/general_constraint.h>
  9. #include <jvalidate/constraint/number_constraint.h>
  10. #include <jvalidate/constraint/object_constraint.h>
  11. #include <jvalidate/constraint/string_constraint.h>
  12. #include <jvalidate/detail/expect.h>
  13. #include <jvalidate/detail/iostream.h>
  14. #include <jvalidate/detail/number.h>
  15. #include <jvalidate/detail/pointer.h>
  16. #include <jvalidate/detail/scoped_state.h>
  17. #include <jvalidate/detail/string_adapter.h>
  18. #include <jvalidate/format.h>
  19. #include <jvalidate/forward.h>
  20. #include <jvalidate/schema.h>
  21. #include <jvalidate/status.h>
  22. #include <jvalidate/validation_config.h>
  23. #include <jvalidate/validation_result.h>
  // Selects, from the active VisitedAnnotation tuple, the set whose element
  // type is `type` (size_t for array indices, std::string for property names).
  // Dereferences visited_, so callers must have checked it for null.
  #define VISITED(type) std::get<std::unordered_set<type>>(*visited_)

  // Validates `subinstance` (found at `path` within the current instance)
  // against `subschema`, folds the outcome into the enclosing function's local
  // `rval`, and - when a result object is attached and the outcome is not Noop -
  // appends `path` to `local_visited`. Any extra arguments are forwarded to
  // validate_subschema_on as schema-path keys.
  #define VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(subschema, subinstance, path, local_visited, ...) \
    do {                                                                                            \
      Status const sub_status_ =                                                                    \
          validate_subschema_on(subschema, subinstance, path __VA_OPT__(, ) __VA_ARGS__);           \
      rval &= sub_status_;                                                                          \
      if (sub_status_ != Status::Noop and result_) {                                                \
        local_visited.insert(local_visited.end(), path);                                            \
      }                                                                                             \
    } while (false)

  // Returns Status::Noop from the enclosing function unless the local
  // `document` has the given adapter type.
  #define NOOP_UNLESS_TYPE(etype) RETURN_UNLESS(adapter::Type::etype == document.type(), Status::Noop)
  // Leaves the *enclosing loop* once the enclosing function's `rval` is already
  // a rejection and nothing is collecting extra information (no result object,
  // no unevaluated* tracking), because further validation cannot change the
  // outcome.
  //
  // This is deliberately NOT wrapped in `do { ... } while (false)`: a `break`
  // inside such a wrapper only exits the wrapper itself and never reaches the
  // caller's loop, which turns the macro into a no-op. The inverted
  // `if (...) {} else break` shape still behaves as a single statement: it
  // consumes the trailing `;` and cannot capture a following `else`.
  #define BREAK_EARLY_IF_NO_RESULT_TREE()                                 \
    if (not(rval == Status::Reject and not result_ and not visited_)) {   \
    } else                                                                \
      break
  41. namespace jvalidate {
  42. template <RegexEngine RE, typename ExtensionVisitor> class ValidationVisitor {
  43. private:
  44. JVALIDATE_TRIBOOL_TYPE(StoreResults, ForValid, ForInvalid, ForAnything);
  45. using VisitedAnnotation = std::tuple<std::unordered_set<size_t>, std::unordered_set<std::string>>;
  46. friend ExtensionVisitor;
  47. private:
  48. detail::Pointer where_;
  49. detail::Pointer schema_path_;
  50. schema::Node const * schema_;
  51. ValidationResult * result_;
  52. ValidationConfig const & cfg_;
  53. ExtensionVisitor extension_;
  54. RE & regex_;
  55. mutable VisitedAnnotation * visited_ = nullptr;
  56. mutable StoreResults tracking_ = StoreResults::ForInvalid;
  57. public:
  58. /**
  59. * @brief Construct a new ValidationVisitor
  60. *
  61. * @param schema The parsed JSON Schema
  62. * @param cfg General configuration settings for how the run is executed
  63. * @param regex A cache of string regular expressions to compiled
  64. * regular expressions
  65. * @param[optional] extension A special visitor for extension constraints.
  66. * @param[optional] result A cache of result/annotation info for the user to
  67. * receive a detailed summary of why a document is supported/unsupported.
  68. */
  69. ValidationVisitor(schema::Node const & schema, ValidationConfig const & cfg, RE & regex,
  70. ExtensionVisitor extension, ValidationResult * result)
  71. : schema_(&schema), result_(result), cfg_(cfg), extension_(extension), regex_(regex) {}
  72. Status visit(constraint::ExtensionConstraint const & cons, Adapter auto const & document) const {
  73. // Because we don't provide any contract constraint on our ExtensionVisitor,
  74. // we instead defer it to here where we validate that the extension can be
  75. // validated given the input document.
  76. // This covers a case where we write the extension around a specific adapter
  77. // instead of generically.
  78. if constexpr (std::is_invocable_r_v<Status, ExtensionVisitor, decltype(cons),
  79. decltype(document), ValidationVisitor const &>) {
  80. return extension_(cons, document, *this);
  81. }
  82. annotate("unsupported extension");
  83. return Status::Noop;
  84. }
  85. Status visit(constraint::TypeConstraint const & cons, Adapter auto const & document) const {
  86. adapter::Type const type = document.type();
  87. for (adapter::Type const accept : cons.types) {
  88. if (type == accept) { // Simple case, types are equal
  89. return result(Status::Accept, type, " is in types [", cons.types, "]");
  90. }
  91. if (accept == adapter::Type::Number && type == adapter::Type::Integer) {
  92. // Number is a super-type of Integer, therefore all Integer values are
  93. // accepted by a `"type": "number"` schema.
  94. return result(Status::Accept, type, " is in types [", cons.types, "]");
  95. }
  96. if (accept == adapter::Type::Integer && type == adapter::Type::Number &&
  97. detail::is_json_integer(document.as_number())) {
  98. // Since the JSON specification does not distinguish between Number
  99. // and Integer, but JSON Schema does, we need to check that the number
  100. // is a whole integer that is representable within the system (64-bit).
  101. return result(Status::Accept, type, " is in types [", cons.types, "]");
  102. }
  103. }
  104. return result(Status::Reject, type, " is not in types [", cons.types, "]");
  105. }
  106. Status visit(constraint::ConstConstraint const & cons, Adapter auto const & document) const {
  107. auto is_equal = [this, &document](auto const & frozen) {
  108. return document.equals(frozen, cfg_.strict_equality);
  109. };
  110. if (cons.value->apply(is_equal)) {
  111. return result(Status::Accept, "matches value");
  112. }
  113. return result(Status::Reject, cons.value, " was expected");
  114. }
  115. Status visit(constraint::EnumConstraint const & cons, Adapter auto const & document) const {
  116. auto is_equal = [this, &document](auto const & frozen) {
  117. return document.equals(frozen, cfg_.strict_equality);
  118. };
  119. for (auto const & [index, option] : detail::enumerate(cons.enumeration)) {
  120. if (option->apply(is_equal)) {
  121. return result(Status::Accept, index);
  122. }
  123. }
  124. return result(Status::Reject, document, " value is not one of ", cons.enumeration);
  125. }
  126. Status visit(constraint::AllOfConstraint const & cons, Adapter auto const & document) const {
  127. Status rval = Status::Accept;
  128. std::set<size_t> unmatched;
  129. for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
  130. if (auto stat = validate_subschema(subschema, document, index); stat == Status::Reject) {
  131. rval = Status::Reject;
  132. unmatched.insert(index);
  133. }
  134. BREAK_EARLY_IF_NO_RESULT_TREE();
  135. }
  136. if (rval == Status::Reject) {
  137. return result(rval, "does not validate subschemas ", unmatched);
  138. }
  139. return result(rval, "validates all subschemas");
  140. }
  141. Status visit(constraint::AnyOfConstraint const & cons, Adapter auto const & document) const {
  142. std::optional<size_t> first_validated;
  143. for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
  144. if (validate_subschema(subschema, document, index)) {
  145. // This technically will produce different results when we're tracking
  146. // visited nodes, but in practice it doesn't actually matter which
  147. // subschema index we record in the annotation.
  148. first_validated = index;
  149. }
  150. if (not visited_ && first_validated.has_value()) {
  151. break;
  152. }
  153. }
  154. if (first_validated.has_value()) {
  155. return result(Status::Accept, "validates subschema ", *first_validated);
  156. }
  157. return result(Status::Reject, "validates none of the subschemas");
  158. }
  159. Status visit(constraint::OneOfConstraint const & cons, Adapter auto const & document) const {
  160. std::set<size_t> matches;
  161. for (auto const & [index, subschema] : detail::enumerate(cons.children)) {
  162. scoped_state(tracking_, StoreResults::ForAnything);
  163. if (validate_subschema(subschema, document, index)) {
  164. matches.insert(index);
  165. }
  166. }
  167. if (matches.size() == 1) {
  168. return result(Status::Accept, "validates subschema ", *matches.begin());
  169. }
  170. return result(Status::Reject, "validates multiple subschemas ", matches);
  171. }
  172. Status visit(constraint::NotConstraint const & cons, Adapter auto const & document) const {
  173. scoped_state(visited_, nullptr);
  174. scoped_state(tracking_, !tracking_);
  175. bool const rejected = validate_subschema(cons.child, document) == Status::Reject;
  176. return rejected;
  177. }
  178. Status visit(constraint::ConditionalConstraint const & cons,
  179. Adapter auto const & document) const {
  180. Status const if_true = [this, &cons, &document]() {
  181. scoped_state(tracking_, StoreResults::ForAnything);
  182. return validate_subschema(cons.if_constraint, document);
  183. }();
  184. annotate(if_true ? "valid" : "invalid");
  185. if (if_true) {
  186. return validate_subschema(cons.then_constraint, document, detail::parent, "then");
  187. }
  188. return validate_subschema(cons.else_constraint, document, detail::parent, "else");
  189. }
  190. Status visit(constraint::MaximumConstraint const & cons, Adapter auto const & document) const {
  191. switch (document.type()) {
  192. case adapter::Type::Integer:
  193. if (int64_t value = document.as_integer(); not cons(value)) {
  194. return result(Status::Reject, value, cons.exclusive ? " >= " : " > ", cons.value);
  195. } else {
  196. return result(Status::Accept, value, cons.exclusive ? " < " : " <= ", cons.value);
  197. }
  198. case adapter::Type::Number:
  199. if (double value = document.as_number(); not cons(value)) {
  200. return result(Status::Reject, value, cons.exclusive ? " >= " : " > ", cons.value);
  201. } else {
  202. return result(Status::Accept, value, cons.exclusive ? " < " : " <= ", cons.value);
  203. }
  204. default:
  205. return Status::Noop;
  206. }
  207. }
  208. Status visit(constraint::MinimumConstraint const & cons, Adapter auto const & document) const {
  209. switch (document.type()) {
  210. case adapter::Type::Integer:
  211. if (int64_t value = document.as_integer(); not cons(value)) {
  212. return result(Status::Reject, value, cons.exclusive ? " <= " : " < ", cons.value);
  213. } else {
  214. return result(Status::Accept, value, cons.exclusive ? " > " : " >= ", cons.value);
  215. }
  216. case adapter::Type::Number:
  217. if (double value = document.as_number(); not cons(value)) {
  218. return result(Status::Reject, value, cons.exclusive ? " <= " : " < ", cons.value);
  219. } else {
  220. return result(Status::Accept, value, cons.exclusive ? " > " : " >= ", cons.value);
  221. }
  222. default:
  223. return Status::Noop;
  224. }
  225. }
  226. Status visit(constraint::MultipleOfConstraint const & cons, Adapter auto const & document) const {
  227. adapter::Type const type = document.type();
  228. RETURN_UNLESS(type == adapter::Type::Number || type == adapter::Type::Integer, Status::Noop);
  229. if (double value = document.as_number(); not cons(value)) {
  230. return result(Status::Reject, value, " is not a multiple of ", cons.value);
  231. } else {
  232. return result(Status::Accept, value, " is a multiple of ", cons.value);
  233. }
  234. }
  235. Status visit(constraint::MaxLengthConstraint const & cons, Adapter auto const & document) const {
  236. NOOP_UNLESS_TYPE(String);
  237. std::string const str = document.as_string();
  238. if (int64_t len = detail::length_u32(str); len > cons.value) {
  239. return result(Status::Reject, "string of length ", len, " is >", cons.value);
  240. } else {
  241. return result(Status::Accept, "string of length ", len, " is <=", cons.value);
  242. }
  243. }
  244. Status visit(constraint::MinLengthConstraint const & cons, Adapter auto const & document) const {
  245. NOOP_UNLESS_TYPE(String);
  246. std::string const str = document.as_string();
  247. if (int64_t len = detail::length_u32(str); len < cons.value) {
  248. return result(Status::Reject, "string of length ", len, " is <", cons.value);
  249. } else {
  250. return result(Status::Accept, "string of length ", len, " is >=", cons.value);
  251. }
  252. }
  253. Status visit(constraint::PatternConstraint const & cons, Adapter auto const & document) const {
  254. NOOP_UNLESS_TYPE(String);
  255. std::string const str = document.as_string();
  256. if (regex_.search(cons.regex, str)) {
  257. return result(Status::Accept, "string matches pattern /", cons.regex, "/");
  258. }
  259. return result(Status::Reject, "string does not match pattern /", cons.regex, "/");
  260. }
  261. Status visit(constraint::FormatConstraint const & cons, Adapter auto const & document) const {
  262. // https://json-schema.org/draft/2020-12/json-schema-validation#name-defined-formats
  263. NOOP_UNLESS_TYPE(String);
  264. annotate(cons.format);
  265. if (not cfg_.validate_format && not cons.is_assertion) {
  266. // Don't both validating formats if we're not in assertion mode
  267. // Assertion mode is specified either by using the appropriate "$vocab"
  268. // meta-schema or by requesting it in the ValidationConfig.
  269. return true; // TODO: I think this can be made into Noop
  270. }
  271. switch (FormatValidator(&RE::is_regex)(cons.format, document.as_string())) {
  272. case FormatValidator::Status::Unimplemented:
  273. return result(Status::Reject, "unimplemented format '", cons.format, "'");
  274. case FormatValidator::Status::Invalid:
  275. return result(Status::Reject, "does not match format '", cons.format, "'");
  276. case FormatValidator::Status::Unknown:
  277. case FormatValidator::Status::Valid:
  278. return result(Status::Accept, "matches format '", cons.format, "'");
  279. }
  280. }
  281. Status visit(constraint::AdditionalItemsConstraint const & cons,
  282. Adapter auto const & document) const {
  283. NOOP_UNLESS_TYPE(Array);
  284. auto array = document.as_array();
  285. Status rval = Status::Accept;
  286. std::vector<size_t> items;
  287. for (size_t i = cons.applies_after_nth; i < array.size(); ++i) {
  288. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(cons.subschema, array[i], i, items);
  289. BREAK_EARLY_IF_NO_RESULT_TREE();
  290. }
  291. annotate_list(items);
  292. return rval;
  293. }
  294. Status visit(constraint::ContainsConstraint const & cons, Adapter auto const & document) const {
  295. NOOP_UNLESS_TYPE(Array);
  296. auto array = document.as_array();
  297. size_t const minimum = cons.minimum.value_or(1);
  298. size_t const maximum = cons.maximum.value_or(array.size());
  299. size_t matches = 0;
  300. for (size_t i = 0; i < array.size(); ++i) {
  301. if (validate_subschema_on(cons.subschema, array[i], i)) {
  302. ++matches;
  303. }
  304. }
  305. if (matches < minimum) {
  306. return result(Status::Reject, "array contains <", minimum, " matching items");
  307. }
  308. if (matches > maximum) {
  309. return result(Status::Reject, "array contains >", maximum, " matching items");
  310. }
  311. return result(Status::Accept, "array contains ", matches, " matching items");
  312. }
  313. Status visit(constraint::MaxItemsConstraint const & cons, Adapter auto const & document) const {
  314. NOOP_UNLESS_TYPE(Array);
  315. if (size_t size = document.array_size(); size > cons.value) {
  316. return result(Status::Reject, "array of size ", size, " is >", cons.value);
  317. } else {
  318. return result(Status::Accept, "array of size ", size, " is <=", cons.value);
  319. }
  320. }
  321. Status visit(constraint::MinItemsConstraint const & cons, Adapter auto const & document) const {
  322. NOOP_UNLESS_TYPE(Array);
  323. if (size_t size = document.array_size(); size < cons.value) {
  324. return result(Status::Reject, "array of size ", size, " is <", cons.value);
  325. } else {
  326. return result(Status::Accept, "array of size ", size, " is >=", cons.value);
  327. }
  328. }
  329. Status visit(constraint::TupleConstraint const & cons, Adapter auto const & document) const {
  330. NOOP_UNLESS_TYPE(Array);
  331. Status rval = Status::Accept;
  332. std::vector<size_t> items;
  333. for (auto const & [index, item] : detail::enumerate(document.as_array())) {
  334. if (index >= cons.items.size()) {
  335. break;
  336. }
  337. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(cons.items[index], item, index, items);
  338. BREAK_EARLY_IF_NO_RESULT_TREE();
  339. }
  340. annotate_list(items);
  341. return rval;
  342. }
  343. template <Adapter A>
  344. Status visit(constraint::UniqueItemsConstraint const & cons, A const & document) const {
  345. NOOP_UNLESS_TYPE(Array);
  346. if constexpr (std::totally_ordered<A>) {
  347. // If the adapter defines comparison operators, then it becomes possible
  348. // to compute uniqueness in O(n*log(n)) checks.
  349. std::map<A, size_t> cache;
  350. for (auto const & [index, elem] : detail::enumerate(document.as_array())) {
  351. if (auto [it, created] = cache.emplace(elem, index); not created) {
  352. return result(Status::Reject, "items ", it->second, " and ", index, " are equal");
  353. }
  354. }
  355. } else {
  356. // Otherwise, we need to run an O(n^2) triangular array search comparing
  357. // equality for each element. This still guarantees that each element is
  358. // compared against each other element no more than once.
  359. auto array = document.as_array();
  360. for (size_t i = 0; i < array.size(); ++i) {
  361. for (size_t j = i + 1; j < array.size(); ++j) {
  362. if (array[i].equals(array[j], true)) {
  363. return result(Status::Reject, "items ", i, " and ", j, " are equal");
  364. }
  365. }
  366. }
  367. }
  368. return result(Status::Accept, "all array items are unique");
  369. }
  370. Status visit(constraint::AdditionalPropertiesConstraint const & cons,
  371. Adapter auto const & document) const {
  372. NOOP_UNLESS_TYPE(Object);
  373. auto matches_any_pattern = [this, &cons](std::string const & key) {
  374. return std::ranges::any_of(cons.patterns, [this, &key](auto const & pattern) {
  375. return regex_.search(pattern, key);
  376. });
  377. };
  378. Status rval = Status::Accept;
  379. std::vector<std::string> properties;
  380. for (auto const & [key, elem] : document.as_object()) {
  381. if (not cons.properties.contains(key) && not matches_any_pattern(key)) {
  382. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(cons.subschema, elem, key, properties);
  383. }
  384. BREAK_EARLY_IF_NO_RESULT_TREE();
  385. }
  386. annotate_list(properties);
  387. return rval;
  388. }
  389. Status visit(constraint::DependenciesConstraint const & cons,
  390. Adapter auto const & document) const {
  391. NOOP_UNLESS_TYPE(Object);
  392. auto object = document.as_object();
  393. Status rval = Status::Accept;
  394. for (auto const & [key, subschema] : cons.subschemas) {
  395. if (not object.contains(key)) {
  396. continue;
  397. }
  398. rval &= validate_subschema(subschema, document, key);
  399. BREAK_EARLY_IF_NO_RESULT_TREE();
  400. }
  401. for (auto [key, required] : cons.required) {
  402. if (not object.contains(key)) {
  403. continue;
  404. }
  405. for (auto const & [key, _] : object) {
  406. required.erase(key);
  407. }
  408. rval &= required.empty();
  409. BREAK_EARLY_IF_NO_RESULT_TREE();
  410. }
  411. return rval;
  412. }
  413. Status visit(constraint::MaxPropertiesConstraint const & cons,
  414. Adapter auto const & document) const {
  415. NOOP_UNLESS_TYPE(Object);
  416. if (size_t size = document.object_size(); size > cons.value) {
  417. return result(Status::Reject, "object of size ", size, " is >", cons.value);
  418. } else {
  419. return result(Status::Accept, "object of size ", size, " is <=", cons.value);
  420. }
  421. }
  422. Status visit(constraint::MinPropertiesConstraint const & cons,
  423. Adapter auto const & document) const {
  424. NOOP_UNLESS_TYPE(Object);
  425. if (size_t size = document.object_size(); size < cons.value) {
  426. return result(Status::Reject, "object of size ", size, " is <", cons.value);
  427. } else {
  428. return result(Status::Accept, "object of size ", size, " is >=", cons.value);
  429. }
  430. }
  431. Status visit(constraint::PatternPropertiesConstraint const & cons,
  432. Adapter auto const & document) const {
  433. NOOP_UNLESS_TYPE(Object);
  434. std::vector<std::string> properties;
  435. Status rval = Status::Accept;
  436. for (auto const & [pattern, subschema] : cons.properties) {
  437. for (auto const & [key, elem] : document.as_object()) {
  438. if (not regex_.search(pattern, key)) {
  439. continue;
  440. }
  441. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(subschema, elem, key, properties);
  442. BREAK_EARLY_IF_NO_RESULT_TREE();
  443. }
  444. }
  445. annotate_list(properties);
  446. return rval;
  447. }
  448. template <Adapter A>
  449. Status visit(constraint::PropertiesConstraint const & cons, A const & document) const {
  450. NOOP_UNLESS_TYPE(Object);
  451. Status rval = Status::Accept;
  452. auto object = document.as_object();
  453. if constexpr (MutableAdapter<A>) {
  454. // Special Rule - if the adapter is of a mutable json document (wraps a
  455. // non-const reference and exposes the assign function) we will process
  456. // the "default" annotation will be applied.
  457. // https://json-schema.org/draft/2020-12/json-schema-validation#section-9.2
  458. //
  459. // Although the JSON Schema draft only says the the default value ought be
  460. // valid against the schema, this implementation will assure that it is
  461. // valid against this PropertiesConstraint, and any other constraints that
  462. // are run after this one.
  463. for (auto const & [key, subschema] : cons.properties) {
  464. auto const * default_value = subschema->default_value();
  465. if (default_value && not object.contains(key)) {
  466. object.assign(key, *default_value);
  467. }
  468. }
  469. }
  470. std::vector<std::string> properties;
  471. for (auto const & [key, elem] : object) {
  472. if (auto it = cons.properties.find(key); it != cons.properties.end()) {
  473. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(it->second, elem, key, properties, key);
  474. }
  475. BREAK_EARLY_IF_NO_RESULT_TREE();
  476. }
  477. annotate_list(properties);
  478. return rval;
  479. }
  480. template <Adapter A>
  481. Status visit(constraint::PropertyNamesConstraint const & cons, A const & document) const {
  482. NOOP_UNLESS_TYPE(Object);
  483. Status rval = Status::Accept;
  484. for (auto const & [key, _] : document.as_object()) {
  485. rval &=
  486. validate_subschema_on(cons.key_schema, detail::StringAdapter(key), std::string("$$key"));
  487. }
  488. return rval;
  489. }
  490. Status visit(constraint::RequiredConstraint const & cons, Adapter auto const & document) const {
  491. NOOP_UNLESS_TYPE(Object);
  492. auto required = cons.properties;
  493. for (auto const & [key, _] : document.as_object()) {
  494. required.erase(key);
  495. }
  496. if (required.empty()) {
  497. return result(Status::Accept, "contains all required properties ", cons.properties);
  498. }
  499. return result(Status::Reject, "missing required properties ", required);
  500. }
  501. Status visit(constraint::UnevaluatedItemsConstraint const & cons,
  502. Adapter auto const & document) const {
  503. NOOP_UNLESS_TYPE(Array);
  504. if (not visited_) {
  505. return Status::Reject;
  506. }
  507. Status rval = Status::Accept;
  508. std::vector<size_t> items;
  509. for (auto const & [index, item] : detail::enumerate(document.as_array())) {
  510. if (not VISITED(size_t).contains(index)) {
  511. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(cons.subschema, item, index, items);
  512. }
  513. BREAK_EARLY_IF_NO_RESULT_TREE();
  514. }
  515. annotate_list(items);
  516. return rval;
  517. }
  518. Status visit(constraint::UnevaluatedPropertiesConstraint const & cons,
  519. Adapter auto const & document) const {
  520. NOOP_UNLESS_TYPE(Object);
  521. if (not visited_) {
  522. return Status::Reject;
  523. }
  524. Status rval = Status::Accept;
  525. std::vector<std::string> properties;
  526. for (auto const & [key, elem] : document.as_object()) {
  527. if (not VISITED(std::string).contains(key)) {
  528. VALIDATE_SUBSCHEMA_AND_MARK_LOCAL_VISIT(cons.subschema, elem, key, properties);
  529. }
  530. BREAK_EARLY_IF_NO_RESULT_TREE();
  531. }
  532. annotate_list(properties);
  533. return rval;
  534. }
  535. /**
  536. * @brief The main entry point into the validator. Validates the provided
  537. * document according to the schema.
  538. */
  539. Status validate(Adapter auto const & document) {
  540. // Step 1) Check if this is an always-false schema. Sometimes, this will
  541. // have a custom message.
  542. if (std::optional<std::string> const & reject = schema_->rejects_all()) {
  543. if (should_annotate(Status::Reject)) {
  544. // This will only be run if we are interested in why something is
  545. // rejected. For example - `{ "not": false }` doesn't produce a
  546. // meaningful annotation...
  547. result_->error(where_, schema_path_, "", *reject);
  548. }
  549. // ...We do always record the result if a result object is present.
  550. (result_ ? result_->valid(where_, schema_path_, false) : void());
  551. return Status::Reject;
  552. }
  553. if (schema_->accepts_all()) {
  554. // An accept-all schema is not No-Op for the purpose of unevaluated*
  555. (result_ ? result_->valid(where_, schema_path_, true) : void());
  556. return Status::Accept;
  557. }
  558. // Begin tracking evaluations for unevaluated* keywords. The annotation
  559. // object is passed down from parent visitor to child visitor to allow all
  560. // schemas to mark whether they visited a certain item or property.
  561. VisitedAnnotation annotate;
  562. if (schema_->requires_result_context() and not visited_) {
  563. visited_ = &annotate;
  564. }
  565. Status rval = Status::Noop;
  566. // Before Draft2019_09, reference schemas could not coexist with other
  567. // constraints. This is enforced in the parsing of the schema, rather than
  568. // during validation {@see jvalidate::schema::Node::construct}.
  569. if (std::optional<schema::Node const *> ref = schema_->reference_schema()) {
  570. // TODO: Investigate why this seems to produce .../$ref/$ref pointers
  571. rval = validate_subschema(*ref, document, "$ref");
  572. }
  573. if (result_ && !schema_->description().empty()) {
  574. result_->annotate(where_, schema_path_, "description", schema_->description());
  575. }
  576. detail::Pointer const current_schema = schema_path_;
  577. for (auto const & [key, p_constraint] : schema_->constraints()) {
  578. BREAK_EARLY_IF_NO_RESULT_TREE();
  579. schema_path_ = current_schema / key;
  580. rval &= std::visit([this, &document](auto & c) { return this->visit(c, document); },
  581. *p_constraint);
  582. }
  583. // Post Constraints represent the unevaluatedItems and unevaluatedProperties
  584. // keywords.
  585. for (auto const & [key, p_constraint] : schema_->post_constraints()) {
  586. BREAK_EARLY_IF_NO_RESULT_TREE();
  587. schema_path_ = current_schema / key;
  588. rval &= std::visit([this, &document](auto & c) { return this->visit(c, document); },
  589. *p_constraint);
  590. }
  591. (result_ ? result_->valid(where_, current_schema, static_cast<bool>(rval)) : void());
  592. return rval;
  593. }
  594. private:
  595. template <typename S>
  596. requires(std::is_constructible_v<std::string, S>)
  597. // Optimization to avoid running string-like objects through a
  598. // std::stringstream in fmtlist.
  599. static std::string fmt(S const & str) {
  600. return str;
  601. }
  602. // Format va_args into a single string to annotate or mark an error message
  603. static std::string fmt(auto const &... args) {
  604. std::stringstream ss;
  605. using ::jvalidate::operator<<;
  606. [[maybe_unused]] int _[] = {(ss << args, 0)...};
  607. return ss.str();
  608. }
  // Format each element of an iterable argument individually, producing a
  // vector of strings to annotate or mark an error.
  static std::vector<std::string> fmtlist(auto const & arg) {
    std::vector<std::string> formatted;
    for (auto const & item : arg) {
      formatted.push_back(fmt(item));
    }
    return formatted;
  }
  618. bool should_annotate(Status stat) const {
  619. if (not result_) {
  620. return false;
  621. }
  622. switch (*tracking_) {
  623. case StoreResults::ForAnything:
  624. return stat != Status::Noop;
  625. case StoreResults::ForValid:
  626. return stat == Status::Accept;
  627. case StoreResults::ForInvalid:
  628. return stat == Status::Reject;
  629. }
  630. }
  631. #define ANNOTATION_HELPER(name, ADD, FMT) \
  632. void name(auto const &... args) const { \
  633. if (not result_) { \
  634. /* do nothing if there's no result object to append to */ \
  635. } else if (schema_path_.empty()) { \
  636. result_->ADD(where_, schema_path_, "", FMT(args...)); \
  637. } else { \
  638. result_->ADD(where_, schema_path_.parent(), schema_path_.back(), FMT(args...)); \
  639. } \
  640. }
  641. ANNOTATION_HELPER(error, error, fmt)
  642. ANNOTATION_HELPER(annotate, annotate, fmt)
  643. ANNOTATION_HELPER(annotate_list, annotate, fmtlist)
  644. Status result(Status stat, auto const &... args) const {
  645. return (should_annotate(stat) ? error(args...) : void(), stat);
  646. }
  647. /**
  648. * @brief Walking function for entering a subschema.
  649. *
  650. * @param subschema The "subschema" being validated. This is either another
  651. * schema object (jvalidate::schema::Node), or a constraint.
  652. * @param keys... The path to this subschema, relative to the current schema
  653. * evaluation.
  654. *
  655. * @return The status of validating the current instance against the
  656. * subschema.
  657. */
  658. template <typename... K>
  659. Status validate_subschema(constraint::SubConstraint const & subschema,
  660. Adapter auto const & document, K const &... keys) const {
  661. if (schema::Node const * const * ppschema = std::get_if<0>(&subschema)) {
  662. return validate_subschema(*ppschema, document, keys...);
  663. } else {
  664. return std::visit([this, &document](auto & c) { return this->visit(c, document); },
  665. *std::get<1>(subschema));
  666. }
  667. }
  668. /**
  669. * @brief Walking function for entering a subschema. Creates a new validation
  670. * visitor in order to continue evaluation.
  671. *
  672. * @param subschema The subschema being validated.
  673. * @param keys... The path to this subschema, relative to the current schema
  674. * evaluation.
  675. *
  676. * @return The status of validating the current instance against the
  677. * subschema.
  678. */
  679. template <typename... K>
  680. Status validate_subschema(schema::Node const * subschema, Adapter auto const & document,
  681. K const &... keys) const {
  682. VisitedAnnotation annotate;
  683. ValidationVisitor next = *this;
  684. ((next.schema_path_ /= keys), ...);
  685. std::tie(next.schema_, next.visited_) =
  686. std::forward_as_tuple(subschema, visited_ ? &annotate : nullptr);
  687. Status rval = next.validate(document);
  688. // Only update the visited annotation of the current context if the
  689. // subschema validates as Accepted.
  690. if (rval == Status::Accept and visited_) {
  691. std::get<0>(*visited_).merge(std::get<0>(annotate));
  692. std::get<1>(*visited_).merge(std::get<1>(annotate));
  693. }
  694. return rval;
  695. }
  696. /**
  697. * @brief Walking function for entering a subschema and child document.
  698. * Creates a new validation visitor in order to continue evaluation.
  699. *
  700. * @param subschema The subschema being validated.
  701. * @param document The child document being evaluated.
  702. * @param key The path to this document instance.
  703. * @param schema_keys... The path to this subschema, relative to the current
  704. * schema evaluation.
  705. *
  706. * @return The status of validating the current instance against the
  707. * subschema.
  708. */
  709. template <typename K>
  710. Status validate_subschema_on(schema::Node const * subschema, Adapter auto const & document,
  711. K const & key, auto const &... schema_keys) const {
  712. ValidationResult result;
  713. ValidationVisitor next = *this;
  714. next.where_ /= key;
  715. ((next.schema_path_ /= schema_keys), ...);
  716. std::tie(next.schema_, next.result_, next.visited_) =
  717. std::forward_as_tuple(subschema, result_ ? &result : nullptr, nullptr);
  718. Status rval = next.validate(document);
  719. // Only update the visited annotation of the current context if the
  720. // subschema validates as Accepted.
  721. if (rval == Status::Accept and visited_) {
  722. VISITED(K).insert(key);
  723. }
  724. // Update the annotation/error content only if a failure is being reported,
  725. // or if we are in an "if" schema.
  726. if ((rval == Status::Reject or tracking_ == StoreResults::ForAnything) and result_) {
  727. result_->merge(std::move(result));
  728. }
  729. return rval;
  730. }
  731. };
  732. }