guardrails-ai
diff --git a/‎guardrails/validators.py‎
Lines changed: 0 additions & 2540 deletions b/‎guardrails/validators.py‎
Lines changed: 0 additions & 2540 deletions
diff --git a/‎guardrails/validators/__init__.py‎
Lines changed: 88 additions & 0 deletions b/‎guardrails/validators/__init__.py‎
Lines changed: 88 additions & 0 deletions
diff --git a/‎guardrails/validators/bug_free_python.py‎
Lines changed: 44 additions & 0 deletions b/‎guardrails/validators/bug_free_python.py‎
Lines changed: 44 additions & 0 deletions
diff --git a/‎guardrails/validators/bug_free_sql.py‎
Lines changed: 46 additions & 0 deletions b/‎guardrails/validators/bug_free_sql.py‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎guardrails/validators/detect_secrets.py‎
Lines changed: 196 additions & 0 deletions b/‎guardrails/validators/detect_secrets.py‎
Lines changed: 196 additions & 0 deletions
@@ -0,0 +1,88 @@
+"""This module contains the validators for the Guardrails framework.
+
+The name with which a validator is registered is the name that is used
+in the `RAIL` spec to specify formatters.
+"""
+
+from guardrails.validator_base import (
+    FailResult,
+    PassResult,
+    ValidationResult,
+    Validator,
+    register_validator,
+)
+from guardrails.validators.bug_free_python import BugFreePython
+from guardrails.validators.bug_free_sql import BugFreeSQL
+from guardrails.validators.detect_secrets import DetectSecrets, detect_secrets
+from guardrails.validators.endpoint_is_reachable import EndpointIsReachable
+from guardrails.validators.ends_with import EndsWith
+from guardrails.validators.exclude_sql_predicates import ExcludeSqlPredicates
+from guardrails.validators.extracted_summary_sentences_match import (
+    ExtractedSummarySentencesMatch,
+)
+from guardrails.validators.extractive_summary import ExtractiveSummary
+from guardrails.validators.is_high_quality_translation import IsHighQualityTranslation
+from guardrails.validators.is_profanity_free import IsProfanityFree
+from guardrails.validators.lower_case import LowerCase
+from guardrails.validators.one_line import OneLine
+from guardrails.validators.pii_filter import AnalyzerEngine, AnonymizerEngine, PIIFilter
+from guardrails.validators.provenance import ProvenanceV0, ProvenanceV1
+from guardrails.validators.pydantic_field_validator import PydanticFieldValidator
+from guardrails.validators.qa_relevance_llm_eval import QARelevanceLLMEval
+from guardrails.validators.reading_time import ReadingTime
+from guardrails.validators.regex_match import RegexMatch
+from guardrails.validators.remove_redundant_sentences import RemoveRedundantSentences
+from guardrails.validators.saliency_check import SaliencyCheck
+from guardrails.validators.similar_to_document import SimilarToDocument
+from guardrails.validators.similar_to_list import SimilarToList
+from guardrails.validators.sql_column_presence import SqlColumnPresence
+from guardrails.validators.two_words import TwoWords
+from guardrails.validators.upper_case import UpperCase
+from guardrails.validators.valid_choices import ValidChoices
+from guardrails.validators.valid_length import ValidLength
+from guardrails.validators.valid_range import ValidRange
+from guardrails.validators.valid_url import ValidURL
+
+# Public API of the package: the names exported by
+# `from guardrails.validators import *`. Every entry is imported above.
+__all__ = [
+    # Validators (one class per validator module imported above)
+    "PydanticFieldValidator",
+    "ValidRange",
+    "ValidChoices",
+    "LowerCase",
+    "UpperCase",
+    "ValidLength",
+    "RegexMatch",
+    "TwoWords",
+    "OneLine",
+    "ValidURL",
+    "EndpointIsReachable",
+    "BugFreePython",
+    "BugFreeSQL",
+    "SqlColumnPresence",
+    "ExcludeSqlPredicates",
+    "SimilarToDocument",
+    "IsProfanityFree",
+    "IsHighQualityTranslation",
+    "EndsWith",
+    "ExtractedSummarySentencesMatch",
+    "ReadingTime",
+    "ExtractiveSummary",
+    "RemoveRedundantSentences",
+    "SaliencyCheck",
+    "QARelevanceLLMEval",
+    "ProvenanceV0",
+    "ProvenanceV1",
+    "PIIFilter",
+    "SimilarToList",
+    "DetectSecrets",
+    # Validator helpers: names re-exported from the `detect_secrets` and
+    # `pii_filter` validator modules.
+    "detect_secrets",
+    "AnalyzerEngine",
+    "AnonymizerEngine",
+    # Base classes and result types re-exported from `guardrails.validator_base`
+    "Validator",
+    "register_validator",
+    "ValidationResult",
+    "PassResult",
+    "FailResult",
+]
@@ -0,0 +1,44 @@
+import ast
+import logging
+from typing import Any, Dict
+
+from guardrails.validator_base import (
+    FailResult,
+    PassResult,
+    ValidationResult,
+    Validator,
+    register_validator,
+)
+
+logger = logging.getLogger(__name__)
+
+
+@register_validator(name="bug-free-python", data_type="string")
+class BugFreePython(Validator):
+    """Validates that there are no Python syntactic bugs in the generated code.
+
+    This validator checks for syntax errors by running `ast.parse(code)`,
+    and will raise an exception if there are any.
+    Only the packages in the `python` environment are available to the code snippet.
+
+    **Key Properties**
+
+    | Property                      | Description                       |
+    | ----------------------------- | --------------------------------- |
+    | Name for `format` attribute   | `bug-free-python`                 |
+    | Supported data types          | `string`                          |
+    | Programmatic fix              | None                              |
+    """
+
+    def validate(self, value: Any, metadata: Dict) -> ValidationResult:
+        logger.debug(f"Validating {value} is not a bug...")
+
+        # The value is a Python code snippet. We need to check for syntax errors.
+        try:
+            ast.parse(value)
+        except SyntaxError as e:
+            return FailResult(
+                error_message=f"Syntax error: {e.msg}",
+            )
+
+        return PassResult()
@@ -0,0 +1,46 @@
+from typing import Any, Callable, Dict, Optional
+
+from guardrails.utils.sql_utils import SQLDriver, create_sql_driver
+from guardrails.validator_base import (
+    FailResult,
+    PassResult,
+    ValidationResult,
+    Validator,
+    register_validator,
+)
+
+
+@register_validator(name="bug-free-sql", data_type=["string"])
+class BugFreeSQL(Validator):
+    """Validates that there are no SQL syntactic bugs in the generated code.
+
+    This is a very minimal implementation that uses the Pypi `sqlvalidator` package
+    to check if the SQL query is valid. You can implement a custom SQL validator
+    that uses a database connection to check if the query is valid.
+
+    **Key Properties**
+
+    | Property                      | Description                       |
+    | ----------------------------- | --------------------------------- |
+    | Name for `format` attribute   | `bug-free-sql`                    |
+    | Supported data types          | `string`                          |
+    | Programmatic fix              | None                              |
+    """
+
+    def __init__(
+        self,
+        conn: Optional[str] = None,
+        schema_file: Optional[str] = None,
+        on_fail: Optional[Callable] = None,
+    ):
+        super().__init__(on_fail=on_fail)
+        self._driver: SQLDriver = create_sql_driver(schema_file=schema_file, conn=conn)
+
+    def validate(self, value: Any, metadata: Dict) -> ValidationResult:
+        errors = self._driver.validate_sql(value)
+        if len(errors) > 0:
+            return FailResult(
+                error_message=". ".join(errors),
+            )
+
+        return PassResult()
@@ -0,0 +1,196 @@
+import os
+import warnings
+from typing import Any, Callable, Dict, List, Tuple, Union
+
+from guardrails.validator_base import (
+    FailResult,
+    PassResult,
+    ValidationResult,
+    Validator,
+    register_validator,
+)
+
+try:
+    import detect_secrets  # type: ignore
+except ImportError:
+    detect_secrets = None
+
+
+@register_validator(name="detect-secrets", data_type="string")
+class DetectSecrets(Validator):
+    """Validates whether the generated code snippet contains any secrets.
+
+    **Key Properties**
+    | Property                      | Description                       |
+    | ----------------------------- | --------------------------------- |
+    | Name for `format` attribute   | `detect-secrets`                  |
+    | Supported data types          | `string`                          |
+    | Programmatic fix              | None                              |
+
+    Parameters: Arguments
+        None
+
+    This validator uses the detect-secrets library to check whether the generated code
+    snippet contains any secrets. If any secrets are detected, the validator fails and
+    returns the generated code snippet with the secrets replaced with asterisks.
+    Else the validator returns the generated code snippet.
+
+    Following are some caveats:
+        - Multiple secrets on the same line may not be caught. e.g.
+            - Minified code
+            - One-line lists/dictionaries
+            - Multi-variable assignments
+        - Multi-line secrets may not be caught. e.g.
+            - RSA/SSH keys
+
+    Example:
+        ```py
+
+        guard = Guard.from_string(validators=[
+            DetectSecrets(on_fail="fix")
+        ])
+        guard.parse(
+            llm_output=code_snippet,
+        )
+    """
+
+    def __init__(self, on_fail: Union[Callable[..., Any], None] = None, **kwargs):
+        super().__init__(on_fail, **kwargs)
+
+        # Check if detect-secrets is installed
+        if detect_secrets is None:
+            raise ValueError(
+                "You must install detect-secrets in order to "
+                "use the DetectSecrets validator."
+            )
+        self.temp_file_name = "temp.txt"
+        self.mask = "********"
+
+    def get_unique_secrets(self, value: str) -> Tuple[Dict[str, Any], List[str]]:
+        """Get unique secrets from the value.
+
+        Args:
+            value (str): The generated code snippet.
+
+        Returns:
+            unique_secrets (Dict[str, Any]): A dictionary of unique secrets and their
+                line numbers.
+            lines (List[str]): The lines of the generated code snippet.
+        """
+        try:
+            # Write each line of value to a new file
+            with open(self.temp_file_name, "w") as f:
+                f.writelines(value)
+        except Exception as e:
+            raise OSError(
+                "Problems creating or deleting the temporary file. "
+                "Please check the permissions of the current directory."
+            ) from e
+
+        try:
+            # Create a new secrets collection
+            from detect_secrets import settings
+            from detect_secrets.core.secrets_collection import SecretsCollection
+
+            secrets = SecretsCollection()
+
+            # Scan the file for secrets
+            with settings.default_settings():
+                secrets.scan_file(self.temp_file_name)
+        except ImportError:
+            raise ValueError(
+                "You must install detect-secrets in order to "
+                "use the DetectSecrets validator."
+            )
+        except Exception as e:
+            raise RuntimeError(
+                "Problems with creating a SecretsCollection or "
+                "scanning the file for secrets."
+            ) from e
+
+        # Get unique secrets from these secrets
+        unique_secrets = {}
+        for secret in secrets:
+            _, potential_secret = secret
+            actual_secret = potential_secret.secret_value
+            line_number = potential_secret.line_number
+            if actual_secret not in unique_secrets:
+                unique_secrets[actual_secret] = [line_number]
+            else:
+                # if secret already exists, avoid duplicate line numbers
+                if line_number not in unique_secrets[actual_secret]:
+                    unique_secrets[actual_secret].append(line_number)
+
+        try:
+            # File no longer needed, read the lines from the file
+            with open(self.temp_file_name, "r") as f:
+                lines = f.readlines()
+        except Exception as e:
+            raise OSError(
+                "Problems reading the temporary file. "
+                "Please check the permissions of the current directory."
+            ) from e
+
+        try:
+            # Delete the file
+            os.remove(self.temp_file_name)
+        except Exception as e:
+            raise OSError(
+                "Problems deleting the temporary file. "
+                "Please check the permissions of the current directory."
+            ) from e
+        return unique_secrets, lines
+
+    def get_modified_value(
+        self, unique_secrets: Dict[str, Any], lines: List[str]
+    ) -> str:
+        """Replace the secrets on the lines with asterisks.
+
+        Args:
+            unique_secrets (Dict[str, Any]): A dictionary of unique secrets and their
+                line numbers.
+            lines (List[str]): The lines of the generated code snippet.
+
+        Returns:
+            modified_value (str): The generated code snippet with secrets replaced with
+                asterisks.
+        """
+        # Replace the secrets on the lines with asterisks
+        for secret, line_numbers in unique_secrets.items():
+            for line_number in line_numbers:
+                lines[line_number - 1] = lines[line_number - 1].replace(
+                    secret, self.mask
+                )
+
+        # Convert lines to a multiline string
+        modified_value = "".join(lines)
+        return modified_value
+
+    def validate(self, value: str, metadata: Dict[str, Any]) -> ValidationResult:
+        # Check if value is a multiline string
+        if "\n" not in value:
+            # Raise warning if value is not a multiline string
+            warnings.warn(
+                "The DetectSecrets validator works best with "
+                "multiline code snippets. "
+                "Refer validator docs for more details."
+            )
+
+            # Add a newline to value
+            value += "\n"
+
+        # Get unique secrets from the value
+        unique_secrets, lines = self.get_unique_secrets(value)
+
+        if unique_secrets:
+            # Replace the secrets on the lines with asterisks
+            modified_value = self.get_modified_value(unique_secrets, lines)
+
+            return FailResult(
+                error_message=(
+                    "The following secrets were detected in your response:\n"
+                    + "\n".join(unique_secrets.keys())
+                ),
+                fix_value=modified_value,
+            )
+        return PassResult()