samtranslator/validator/validator.py (89 lines of code) (raw):

import json import os import re from pathlib import Path from typing import Any import jsonschema from samtranslator.internal.deprecation_control import deprecated from . import sam_schema class SamTemplateValidator: """ SAM function validation, on the deprecation path. """ UNICODE_TYPE_REGEX = re.compile("u('[^']+')") @deprecated() def __init__(self, schema=None) -> None: # type: ignore[no-untyped-def] """ Constructor Parameters ---------- schema_path : str, optional Path to a schema to use for validation, by default None, the default schema.json will be used """ if not schema: schema = self._read_json(sam_schema.SCHEMA_NEW_FILE) # Helps resolve the $Ref to external files # For cross platform resolving, we have to load the sub schemas into # a store and pass it to the Resolver. We cannot use the "file://" style # of referencing inside a "$ref" of a schema as this will lead to mixups # on Windows because of different path separator: \\ instead of / schema_store = {} definitions_dir = sam_schema.SCHEMA_DIR / "definitions" for sub_schema in os.listdir(definitions_dir): if sub_schema.endswith(".json"): with (definitions_dir / sub_schema).open(encoding="utf-8") as f: schema_content = f.read() schema_store[sub_schema] = json.loads(schema_content) resolver = jsonschema.RefResolver.from_schema(schema, store=schema_store) # type: ignore[no-untyped-call] SAMValidator = jsonschema.validators.extend( jsonschema.Draft7Validator, type_checker=jsonschema.Draft7Validator.TYPE_CHECKER.redefine_many( {"object": is_object, "intrinsic": is_intrinsic} ), ) self.validator = SAMValidator(schema, resolver=resolver) @staticmethod @deprecated() def validate(template_dict, schema=None): # type: ignore[no-untyped-def] """ Validates a SAM Template [DEPRECATED]: Instanciate this class and use the get_errors instead: validator = SamTemplateValidator() validator.get_errors(template_dict) Kept for backward compatibility Parameters ---------- template_dict : dict Template schema : dict, optional Schema content, defaults to the integrated schema Returns ------- str Validation errors separated by commas "," """ validator = SamTemplateValidator(schema) return ", ".join(validator.get_errors(template_dict)) @deprecated() def get_errors(self, template_dict): # type: ignore[no-untyped-def] """ Validates a SAM Template Parameters ---------- template_dict : dict Template to validate schema : str, optional Schema content, by default None Returns ------- list[str] List of validation errors if any, empty otherwise """ # Tree of Error objects # Each object can have a list of child errors in its Context attribute validation_errors = self.validator.iter_errors(template_dict) # Set of "[Path.To.Element] Error message" # To track error uniqueness, Dict instead of List, for speed errors_set = {} # type: ignore[var-annotated] for e in validation_errors: self._process_error(e, errors_set) # type: ignore[no-untyped-call] # To be consistent across python versions 2 and 3, we have to sort the final result # It seems that the validator is not receiving the properties in the same order between python 2 and 3 # It thus returns errors in a different order return sorted(errors_set.keys()) def _process_error(self, error, errors_set): # type: ignore[no-untyped-def] """ Processes the validation errors recursively error is actually a tree of errors Each error can have a list of child errors in its 'context' attribute Parameters ---------- error : Error Error at the head errors_set : Dict Set of formatted errors """ if error is None: return if not error.context: # We only display the leaves # Format the message with pseudo JSON Path: # [Path.To.Element] Error message error_path = ".".join([str(p) for p in error.absolute_path]) if error.absolute_path else "." error_content = f"[{error_path}] {self._cleanup_error_message(error)}" # type: ignore[no-untyped-call] if error_content not in errors_set: # We set the value to None as we don't use it errors_set[error_content] = None return for context_error in error.context: # Each "context" item is also a validation error self._process_error(context_error, errors_set) # type: ignore[no-untyped-call] def _cleanup_error_message(self, error): # type: ignore[no-untyped-def] """ Cleans an error message up to remove unecessary clutter or replace it with a more meaningful one Parameters ---------- error : Error Error message to clean Returns ------- str Cleaned message """ final_message = re.sub(self.UNICODE_TYPE_REGEX, r"\1", error.message) if final_message.endswith(" under any of the given schemas"): return "Is not valid" if final_message.startswith(("None is not of type ", "None is not one of ")): return "Must not be empty" if " does not match " in final_message and "patternError" in error.schema: return re.sub("does not match .+", error.schema.get("patternError"), final_message) return final_message def _read_json(self, filepath: Path) -> Any: """ Returns the content of a JSON file Parameters ---------- filepath : Path File path Returns ------- dict Dictionary representing the JSON content """ with filepath.open(encoding="utf-8") as fp: return json.load(fp) # Type definition redefinitions INTRINSIC_ATTR = { "Fn::And", "Fn::Base64", "Fn::Cidr", "Fn::Equals", "Fn::FindInMap", "Fn::GetAtt", "Fn::GetAZs", "Fn::If", "Fn::ImportValue", "Fn::Join", "Fn::Not", "Fn::Or", "Fn::Select", "Fn::Split", "Fn::Sub", "Fn::Transform", "Ref", } def is_object(checker, instance): # type: ignore[no-untyped-def] """ 'object' type definition Overloaded to exclude intrinsic functions Parameters ---------- checker : dict Checker instance : element Template element Returns ------- boolean True if an object, False otherwise """ return isinstance(instance, dict) and not has_intrinsic_attr(instance) # type: ignore[no-untyped-call] def is_intrinsic(checker, instance): # type: ignore[no-untyped-def] """ 'intrinsic' type definition Parameters ---------- checker : dict [description] instance : [type] [description] Returns ------- [type] [description] """ return isinstance(instance, dict) and has_intrinsic_attr(instance) # type: ignore[no-untyped-call] def has_intrinsic_attr(instance): # type: ignore[no-untyped-def] """ Returns a value indicating whether the instance has an intrinsic attribute Only one attribute which must be one of the intrinsics Parameters ---------- instance : dict Dictionary Returns ------- boolean True if only has one intrinsic attribute, False otherwise """ return len(instance) == 1 and next(iter(instance)) in INTRINSIC_ATTR