pypa
diff --git a/‎setuptools-scm/testing_scm/test_integration.py‎
Lines changed: 1 addition & 1 deletion b/‎setuptools-scm/testing_scm/test_integration.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎vcs-versioning/src/vcs_versioning/_overrides.py‎
Lines changed: 109 additions & 70 deletions b/‎vcs-versioning/src/vcs_versioning/_overrides.py‎
Lines changed: 109 additions & 70 deletions
diff --git a/‎vcs-versioning/src/vcs_versioning/_toml.py‎
Lines changed: 74 additions & 6 deletions b/‎vcs-versioning/src/vcs_versioning/_toml.py‎
Lines changed: 74 additions & 6 deletions
@@ -237,7 +237,7 @@ def test_pretend_metadata_invalid_fields_filtered(
         version = wd.get_version()
         assert version == "1.0.0"
 
-    assert "Invalid metadata fields in pretend metadata" in caplog.text
+    assert "Invalid fields in TOML data" in caplog.text
     assert "invalid_field" in caplog.text
     assert "another_bad_field" in caplog.text
 
 
@@ -8,18 +8,79 @@
 
 import dataclasses
 import logging
+import os
+import sys
 from collections.abc import Mapping
+from datetime import date, datetime
 from difflib import get_close_matches
-from typing import Any
+from re import Pattern
+from typing import TYPE_CHECKING, Any, TypedDict, get_type_hints
 
 from packaging.utils import canonicalize_name
 
 from . import _config
+from . import _types as _t
 from . import _version_schemes as version
-from ._toml import load_toml_or_inline_map
+from ._version_cls import Version as _Version
+
+if TYPE_CHECKING:
+    pass
+
+if sys.version_info >= (3, 11):
+    pass
+else:
+    pass
 
 log = logging.getLogger(__name__)
 
+
+# TypedDict schemas for TOML data validation and type hints
+
+
+class PretendMetadataDict(TypedDict, total=False):
+    """Schema for ScmVersion metadata fields that can be overridden via environment.
+
+    All keys are optional (``total=False``); the annotations drive runtime type checks.
+    """
+
+    tag: str | _Version
+    distance: int
+    node: str | None
+    dirty: bool
+    preformatted: bool
+    branch: str | None
+    node_date: date | None
+    time: datetime
+
+
+class ConfigOverridesDict(TypedDict, total=False):
+    """Schema for Configuration fields that can be overridden via environment.
+
+    All keys are optional (``total=False``) since partial overrides are allowed.
+    """
+
+    # Configuration fields
+    root: _t.PathT
+    version_scheme: _t.VERSION_SCHEME
+    local_scheme: _t.VERSION_SCHEME
+    tag_regex: str | Pattern[str]
+    parentdir_prefix_version: str | None
+    fallback_version: str | None
+    fallback_root: _t.PathT
+    write_to: _t.PathT | None
+    write_to_template: str | None
+    version_file: _t.PathT | None
+    version_file_template: str | None
+    parse: Any  # ParseFunction - avoid circular import
+    git_describe_command: _t.CMD_TYPE | None  # deprecated but still supported
+    dist_name: str | None
+    version_cls: Any  # type[_Version] - avoid circular import
+    normalize: bool  # Used in from_data
+    search_parent_directories: bool
+    parent: _t.PathT | None
+    scm: dict[str, Any]  # Nested SCM configuration
+
+
 PRETEND_KEY = "SETUPTOOLS_SCM_PRETEND_VERSION"
 PRETEND_KEY_NAMED = PRETEND_KEY + "_FOR_{name}"
 PRETEND_METADATA_KEY = "SETUPTOOLS_SCM_PRETEND_METADATA"
@@ -90,7 +151,7 @@ def _find_close_env_var_matches(
 
 def _read_pretended_metadata_for(
     config: _config.Configuration,
-) -> dict[str, Any] | None:
+) -> PretendMetadataDict | None:
     """read overridden metadata from the environment
 
     tries ``SETUPTOOLS_SCM_PRETEND_METADATA``
@@ -99,8 +160,6 @@ def _read_pretended_metadata_for(
     Returns a dictionary with metadata field overrides like:
     {"node": "g1337beef", "distance": 4}
     """
-    import os
-
     from .overrides import EnvReader
 
     log.debug("dist name: %s", config.dist_name)
@@ -110,39 +169,15 @@ def _read_pretended_metadata_for(
         env=os.environ,
         dist_name=config.dist_name,
     )
-    pretended = reader.read("PRETEND_METADATA")
 
-    if pretended:
-        try:
-            metadata_overrides = load_toml_or_inline_map(pretended)
-            # Validate that only known ScmVersion fields are provided
-            valid_fields = {
-                "tag",
-                "distance",
-                "node",
-                "dirty",
-                "preformatted",
-                "branch",
-                "node_date",
-                "time",
-            }
-            invalid_fields = set(metadata_overrides.keys()) - valid_fields
-            if invalid_fields:
-                log.warning(
-                    "Invalid metadata fields in pretend metadata: %s. "
-                    "Valid fields are: %s",
-                    invalid_fields,
-                    valid_fields,
-                )
-                # Remove invalid fields but continue processing
-                for field in invalid_fields:
-                    metadata_overrides.pop(field)
-
-            return metadata_overrides or None
-        except Exception as e:
-            log.error("Failed to parse pretend metadata: %s", e)
-            return None
-    else:
+    try:
+        # Use schema validation during TOML parsing
+        metadata_overrides = reader.read_toml(
+            "PRETEND_METADATA", schema=PretendMetadataDict
+        )
+        return metadata_overrides or None
+    except Exception as e:
+        log.error("Failed to parse pretend metadata: %s", e)
         return None
 
 
@@ -177,36 +212,41 @@ def _apply_metadata_overrides(
 
     log.info("Applying metadata overrides: %s", metadata_overrides)
 
-    # Define type checks and field mappings
-    from datetime import date, datetime
-
-    field_specs: dict[str, tuple[type | tuple[type, type], str]] = {
-        "distance": (int, "int"),
-        "dirty": (bool, "bool"),
-        "preformatted": (bool, "bool"),
-        "node_date": (date, "date"),
-        "time": (datetime, "datetime"),
-        "node": ((str, type(None)), "str or None"),
-        "branch": ((str, type(None)), "str or None"),
-        # tag is special - can be multiple types, handled separately
-    }
-
-    # Apply each override individually using dataclasses.replace for type safety
+    # Get type hints from PretendMetadataDict for validation
+    field_types = get_type_hints(PretendMetadataDict)
+
+    # Apply each override individually using dataclasses.replace
     result = scm_version
 
     for field, value in metadata_overrides.items():
-        if field in field_specs:
-            expected_type, type_name = field_specs[field]
-            assert isinstance(value, expected_type), (
-                f"{field} must be {type_name}, got {type(value).__name__}: {value!r}"
-            )
-            result = dataclasses.replace(result, **{field: value})
-        elif field == "tag":
-            # tag can be Version, NonNormalizedVersion, or str - we'll let the assignment handle validation
-            result = dataclasses.replace(result, tag=value)
-        else:
-            # This shouldn't happen due to validation in _read_pretended_metadata_for
-            log.warning("Unknown field '%s' in metadata overrides", field)
+        # Validate field types using the TypedDict annotations
+        if field in field_types:
+            expected_type = field_types[field]
+            # Handle Optional/Union types (e.g., str | None)
+            if hasattr(expected_type, "__args__"):
+                # Union type - check if value is instance of any of the types
+                valid = any(
+                    isinstance(value, t) if t is not type(None) else value is None
+                    for t in expected_type.__args__
+                )
+                if not valid:
+                    type_names = " | ".join(
+                        t.__name__ if t is not type(None) else "None"
+                        for t in expected_type.__args__
+                    )
+                    raise TypeError(
+                        f"Field '{field}' must be {type_names}, "
+                        f"got {type(value).__name__}: {value!r}"
+                    )
+            else:
+                # Simple type
+                if not isinstance(value, expected_type):
+                    raise TypeError(
+                        f"Field '{field}' must be {expected_type.__name__}, "
+                        f"got {type(value).__name__}: {value!r}"
+                    )
+
+        result = dataclasses.replace(result, **{field: value})  # type: ignore[arg-type]
 
     # Ensure config is preserved (should not be overridden)
     assert result.config is config, "Config must be preserved during metadata overrides"
@@ -222,8 +262,6 @@ def _read_pretended_version_for(
     tries ``SETUPTOOLS_SCM_PRETEND_VERSION``
     and ``SETUPTOOLS_SCM_PRETEND_VERSION_FOR_$UPPERCASE_DIST_NAME``
     """
-    import os
-
     from .overrides import EnvReader
 
     log.debug("dist name: %s", config.dist_name)
@@ -241,15 +279,16 @@ def _read_pretended_version_for(
         return None
 
 
-def read_toml_overrides(dist_name: str | None) -> dict[str, Any]:
-    """Read TOML overrides from environment."""
-    import os
+def read_toml_overrides(dist_name: str | None) -> ConfigOverridesDict:
+    """Read TOML overrides from environment.
 
+    Reads ``OVERRIDES`` via ``EnvReader`` using ``ConfigOverridesDict`` as the schema.
+    """
     from .overrides import EnvReader
 
     reader = EnvReader(
         tools_names=("SETUPTOOLS_SCM", "VCS_VERSIONING"),
         env=os.environ,
         dist_name=dist_name,
     )
-    return reader.read_toml("OVERRIDES")
+    return reader.read_toml("OVERRIDES", schema=ConfigOverridesDict)
@@ -4,7 +4,7 @@
 import sys
 from collections.abc import Callable
 from pathlib import Path
-from typing import Any, TypeAlias, TypedDict, cast
+from typing import Any, TypeAlias, TypedDict, TypeVar, cast, get_type_hints
 
 if sys.version_info >= (3, 11):
     from tomllib import loads as load_toml
@@ -17,11 +17,18 @@
 TOML_RESULT: TypeAlias = dict[str, Any]
 TOML_LOADER: TypeAlias = Callable[[str], TOML_RESULT]
 
+# TypeVar for generic TypedDict support - the schema defines the return type
+TSchema = TypeVar("TSchema", bound=TypedDict)  # type: ignore[valid-type]
+
 
 class InvalidTomlError(ValueError):
     """Raised when TOML data cannot be parsed."""
 
 
+class InvalidTomlSchemaError(ValueError):
+    """Raised when TOML data does not conform to the expected schema."""
+
+
 def read_toml_content(path: Path, default: TOML_RESULT | None = None) -> TOML_RESULT:
     try:
         data = path.read_text(encoding="utf-8")
@@ -42,17 +49,78 @@ class _CheatTomlData(TypedDict):
     cheat: dict[str, Any]
 
 
-def load_toml_or_inline_map(data: str | None) -> dict[str, Any]:
+def _validate_against_schema(
+    data: dict[str, Any],
+    schema: type[TypedDict] | None,  # type: ignore[valid-type]
+) -> dict[str, Any]:
+    """Filter parsed TOML data down to the keys declared by a TypedDict schema.
+
+    Args:
+        data: Parsed TOML data to validate
+        schema: TypedDict class defining valid fields, or None to skip validation
+
+    Returns:
+        ``data`` itself if nothing was filtered, else a new dict without unknown keys
+
+    Note:
+        Unknown keys are only logged and dropped (no raise); value types go unchecked
     """
-    load toml data - with a special hack if only a inline map is given
+    if schema is None:
+        return data
+
+    # Extract valid field names from the TypedDict
+    try:
+        valid_fields = frozenset(get_type_hints(schema).keys())
+    except NameError as e:
+        # If type hints can't be resolved, log warning and skip validation
+        log.warning("Could not resolve type hints for schema validation: %s", e)
+        return data
+
+    # If the schema has no fields (empty TypedDict), skip validation
+    if not valid_fields:
+        return data
+
+    invalid_fields = set(data.keys()) - valid_fields
+    if invalid_fields:
+        log.warning(
+            "Invalid fields in TOML data: %s. Valid fields are: %s",
+            sorted(invalid_fields),
+            sorted(valid_fields),
+        )
+        # Build a new dict without the unknown keys; ``data`` is left unmodified
+        validated_data = {k: v for k, v in data.items() if k not in invalid_fields}
+        return validated_data
+
+    return data
+
+
+def load_toml_or_inline_map(data: str | None, *, schema: type[TSchema]) -> TSchema:
+    """Load toml data - with a special hack if only an inline map is given.
+
+    Args:
+        data: TOML string to parse; None or an empty string yields an empty dict
+        schema: TypedDict class for schema validation.
+               Unknown keys will be logged as warnings and removed.
+
+    Returns:
+        Parsed TOML data with keys not declared by ``schema`` removed
+
+    Raises:
+        InvalidTomlError: If loading fails for any reason (exceptions are wrapped)
     """
     if not data:
-        return {}
+        return {}  # type: ignore[return-value]
     try:
         if data[0] == "{":
             data = "cheat=" + data
             loaded: _CheatTomlData = cast(_CheatTomlData, load_toml(data))
-            return loaded["cheat"]
-        return load_toml(data)
+            result = loaded["cheat"]
+        else:
+            result = load_toml(data)
+
+        return _validate_against_schema(result, schema)  # type: ignore[return-value]
     except Exception as e:  # tomllib/tomli raise different decode errors
+        # Let InvalidTomlSchemaError propagate as-is instead of wrapping it below
+        if isinstance(e, InvalidTomlSchemaError):
+            raise
         raise InvalidTomlError("Invalid TOML content") from e