Spaces:

wandb
/

guardrails-genie

Running

App Files Files Community

ash0ts committed on Nov 22, 2024

Commit

7e16d4f

1 Parent(s): 778809b

Add regex variant workflow

Browse files

Files changed (4) hide show

guardrails_genie/guardrails/pii/__init__.py +0 -0
guardrails_genie/guardrails/pii/regex_pii_guardrail.py +79 -0
guardrails_genie/guardrails/pii/run_regex_model.py +21 -0
guardrails_genie/regex_model.py +65 -0

guardrails_genie/guardrails/pii/__init__.py ADDED Viewed

File without changes

guardrails_genie/guardrails/pii/regex_pii_guardrail.py ADDED Viewed

	@@ -0,0 +1,79 @@

+from typing import Dict, Optional, ClassVar
+import weave
+from pydantic import BaseModel
+from ...regex_model import RegexModel
+from ..base import Guardrail
class RegexPIIGuardrailResponse(BaseModel):
    """Result returned by ``RegexPIIGuardrail.guard`` for a single prompt."""

    # True when at least one configured pattern matched the prompt.
    contains_pii: bool
    # Pattern name -> list of matches found for that pattern.
    detected_pii_types: Dict[str, list[str]]
    # Logical opposite of ``contains_pii``: True when nothing matched.
    safe_to_process: bool
    # Human-readable, multi-line summary of what was and was not found.
    explanation: str
class RegexPIIGuardrail(Guardrail):
    """Guardrail that flags PII in a prompt using named regular expressions.

    The patterns are handed to a ``RegexModel``; ``guard`` runs that model on
    the prompt and turns its result into a ``RegexPIIGuardrailResponse``.
    """

    # Model that performs the actual regex matching.
    regex_model: RegexModel
    # Effective pattern set (defaults merged with caller-supplied patterns).
    patterns: Dict[str, str] = {}
    # Built-in patterns, keyed by PII type name. These are purely syntactic
    # checks: e.g. "bank_account" matches any run of 8-17 digits and
    # "zip_code" any 5-digit number, so overlapping/false-positive hits are
    # possible.
    DEFAULT_PII_PATTERNS: ClassVar[Dict[str, str]] = {
        "email": r"[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}",
        "phone_number": r"\b(?:\+?1[-.]?)?\(?(?:[0-9]{3})\)?[-.]?(?:[0-9]{3})[-.]?(?:[0-9]{4})\b",
        "ssn": r"\b\d{3}[-]?\d{2}[-]?\d{4}\b",
        "credit_card": r"\b\d{4}[-.]?\d{4}[-.]?\d{4}[-.]?\d{4}\b",
        "ip_address": r"\b\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}\b",
        "date_of_birth": r"\b\d{2}[-/]\d{2}[-/]\d{4}\b",
        "passport": r"\b[A-Z]{1,2}[0-9]{6,9}\b",
        "drivers_license": r"\b[A-Z]\d{7}\b",
        "bank_account": r"\b\d{8,17}\b",
        "zip_code": r"\b\d{5}(?:[-]\d{4})?\b"
    }

    def __init__(self, use_defaults: bool = True, **kwargs):
        """Build the guardrail from the default and/or custom patterns.

        Args:
            use_defaults: When true, start from ``DEFAULT_PII_PATTERNS``.
            **kwargs: Only the ``patterns`` key is read (a mapping of
                name -> regex). Its entries are added on top of the defaults
                and override defaults with the same name. Other keyword
                arguments are not forwarded to the base initializer.
        """
        merged = dict(self.DEFAULT_PII_PATTERNS) if use_defaults else {}
        custom = kwargs.get("patterns")
        if custom:
            merged.update(custom)
        # The same merged mapping is given to the model and stored on the
        # guardrail itself.
        super().__init__(regex_model=RegexModel(patterns=merged), patterns=merged)

    @weave.op()
    def guard(self, prompt: str, **kwargs) -> RegexPIIGuardrailResponse:
        """
        Scan ``prompt`` with the configured regex patterns and report PII.

        Args:
            prompt: Input text to check for PII
            **kwargs: Accepted but not used by this method.

        Returns:
            RegexPIIGuardrailResponse with the matches per PII type, the
            pass/fail flags and a textual explanation.
        """
        outcome = self.regex_model.check(prompt)
        hits = outcome.matched_patterns
        misses = outcome.failed_patterns

        # First section: what was found (or a note that nothing was).
        if hits:
            lines = ["Found the following PII in the text:"]
            lines.extend(
                f"- {pii_type}: {len(found)} instance(s)"
                for pii_type, found in hits.items()
            )
        else:
            lines = ["No PII detected in the text."]

        # Second section: pattern names that produced no match.
        if misses:
            lines.append("\nChecked but did not find these PII types:")
            lines.extend(f"- {name}" for name in misses)

        return RegexPIIGuardrailResponse(
            contains_pii=not outcome.passed,
            detected_pii_types=hits,
            safe_to_process=outcome.passed,
            explanation="\n".join(lines)
        )

guardrails_genie/guardrails/pii/run_regex_model.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from guardrails_genie.guardrails.pii.regex_pii_guardrail import RegexPIIGuardrail
+import weave
def run_regex_model():
    """Run the default regex PII guardrail on a sample prompt and print the result."""
    weave.init("guardrails-genie-pii-regex-model")

    sample_prompt = "Please contact john.doe@email.com or call 123-456-7890"
    # Guardrail using only the built-in default patterns.
    guardrail = RegexPIIGuardrail(use_defaults=True)

    print(guardrail.guard(sample_prompt))
    # The printed result is expected to contain:
    # - contains_pii: True
    # - detected_pii_types: {"email": ["john.doe@email.com"], "phone_number": ["123-456-7890"]}
    # - safe_to_process: False
    # - explanation: Detailed explanation of findings


if __name__ == "__main__":
    run_regex_model()

guardrails_genie/regex_model.py ADDED Viewed

	@@ -0,0 +1,65 @@

+from typing import List, Dict, Optional
+import re
+import weave
+from pydantic import BaseModel
class RegexResult(BaseModel):
    """Outcome of checking one text against a set of named regex patterns."""

    # True only when none of the patterns matched.
    passed: bool
    # Pattern name -> matches found in the text (only patterns that matched).
    matched_patterns: Dict[str, List[str]]
    # Names of the patterns that produced no match.
    failed_patterns: List[str]
class RegexModel(weave.Model):
    """Model that checks text against a dictionary of named regex patterns."""

    # Pattern name -> regex source string.
    patterns: Dict[str, str]

    def __init__(self, patterns: Dict[str, str]) -> None:
        """
        Initialize RegexModel with a dictionary of patterns.

        Args:
            patterns: Dictionary where key is pattern name and value is regex pattern
                     Example: {"email": r"[^@ \t\r\n]+@[^@ \t\r\n]+\.[^@ \t\r\n]+",
                              "phone": r"\b\d{3}[-.]?\d{3}[-.]?\d{4}\b"}

        Raises:
            re.error: If any pattern is not a valid regular expression.
        """
        super().__init__(patterns=patterns)
        # Compile once up front so check() does not recompile per call.
        # Assigned after super().__init__() so the model is fully initialized
        # before the extra attribute is attached.
        self._compiled_patterns = {
            name: re.compile(pattern) for name, pattern in patterns.items()
        }

    @weave.op()
    def check(self, text: str) -> RegexResult:
        """
        Check text against all patterns and return detailed results.

        Args:
            text: Input text to check against patterns

        Returns:
            RegexResult containing pass/fail status and details about matches.
            ``matched_patterns`` always holds the full matched substrings,
            even when a pattern contains capture groups.
        """
        matches: Dict[str, List[str]] = {}
        failed_patterns: List[str] = []
        for pattern_name, compiled_pattern in self._compiled_patterns.items():
            # finditer + group(0) instead of findall: findall returns the
            # capture-group contents (or tuples for several groups) rather
            # than the whole match, which would report the wrong text and
            # break the List[str] result type for patterns with groups.
            found_matches = [
                match.group(0) for match in compiled_pattern.finditer(text)
            ]
            if found_matches:
                matches[pattern_name] = found_matches
            else:
                failed_patterns.append(pattern_name)
        # Consider it passed only if no patterns matched (no PII found)
        return RegexResult(
            passed=not matches,
            matched_patterns=matches,
            failed_patterns=failed_patterns
        )

    @weave.op()
    def predict(self, text: str) -> RegexResult:
        """
        Alias for check() to maintain consistency with other models.
        """
        return self.check(text)