Source code for pain001.xml.validate_via_xsd
from functools import lru_cache
from io import StringIO
import xmlschema
from defusedxml import ElementTree as defused_et
from defusedxml.ElementTree import ParseError
@lru_cache(maxsize=16)
def _get_cached_schema(xsd_file_path: str) -> xmlschema.XMLSchema:
"""Return a cached XMLSchema instance for the given XSD file path."""
return xmlschema.XMLSchema(xsd_file_path)
# Copyright (C) 2023-2026 Sebastien Rousseau.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
# implied.
# See the License for the specific language governing permissions and
# limitations under the License.
[docs]
def validate_via_xsd(xml_file_path: str, xsd_file_path: str) -> bool:
"""
Validates an XML file against an XSD schema.
Args:
xml_file_path (str): Path to the XML file to validate.
xsd_file_path (str): Path to the XSD schema file.
Returns:
bool: True if the XML file is valid, False otherwise.
"""
# Load XML file into an ElementTree object using defusedxml for security.
try:
xml_tree = defused_et.parse(xml_file_path)
except (ParseError, OSError) as e:
print(f"Error parsing XML file: {e}")
return False
# Load XSD schema into an XMLSchema object (cached).
try:
xsd = _get_cached_schema(xsd_file_path)
except (xmlschema.XMLSchemaException, ParseError, OSError) as e:
print(f"Error loading XSD schema: {e}")
return False
# Validate XML file against XSD schema.
try:
xsd.validate(xml_tree)
return True
except xmlschema.XMLSchemaException as e:
print(f"Error validating XML: {e}")
return False
[docs]
def validate_xml_string_via_xsd(xml_content: str, xsd_file_path: str) -> bool:
"""
Validates an XML string against an XSD schema.
This function is ideal for serverless/API architectures where XML is
generated in-memory without writing to disk.
Args:
xml_content (str): XML content as a string.
xsd_file_path (str): Path to the XSD schema file.
Returns:
bool: True if the XML content is valid, False otherwise.
Examples:
>>> xml_str = '<?xml version="1.0"?><Document></Document>'
>>> xsd_path = "schema.xsd"
>>> validate_xml_string_via_xsd(xml_str, xsd_path) # doctest: +SKIP
True
"""
# Load XML string into an ElementTree object using defusedxml for security.
try:
xml_tree = defused_et.parse(StringIO(xml_content))
except (ParseError, OSError) as e:
print(f"Error parsing XML string: {e}")
return False
# Load XSD schema into an XMLSchema object (cached).
try:
xsd = _get_cached_schema(xsd_file_path)
except (xmlschema.XMLSchemaException, ParseError, OSError) as e:
print(f"Error loading XSD schema: {e}")
return False
# Validate XML against XSD schema.
try:
xsd.validate(xml_tree)
return True
except xmlschema.XMLSchemaException as e:
print(f"Error validating XML: {e}")
return False