geekyrakshit committed
Commit 78a1bf0 · 1 Parent(s): 36c3c0f

add: docs for AccuracyMetric

guardrails_genie/guardrails/__init__.py CHANGED
@@ -1,12 +1,12 @@
-from .injection import (
-    PromptInjectionClassifierGuardrail,
-    PromptInjectionSurveyGuardrail,
-)
 from .entity_recognition import (
     PresidioEntityRecognitionGuardrail,
     RegexEntityRecognitionGuardrail,
-    TransformersEntityRecognitionGuardrail,
     RestrictedTermsJudge,
+    TransformersEntityRecognitionGuardrail,
+)
+from .injection import (
+    PromptInjectionClassifierGuardrail,
+    PromptInjectionSurveyGuardrail,
 )
 from .manager import GuardrailManager

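
The reordering above looks like isort's alphabetical import grouping; the package's public surface is unchanged. As a quick sanity sketch (not part of the commit), every re-exported name should still resolve from the package root:

# Import smoke test (illustrative only): all names re-exported by the
# __init__.py above should resolve from the package root after the reorder.
from guardrails_genie.guardrails import (
    GuardrailManager,
    PresidioEntityRecognitionGuardrail,
    PromptInjectionClassifierGuardrail,
    PromptInjectionSurveyGuardrail,
    RegexEntityRecognitionGuardrail,
    RestrictedTermsJudge,
    TransformersEntityRecognitionGuardrail,
)

print(GuardrailManager, RestrictedTermsJudge)  # both names resolve
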
guardrails_genie/guardrails/entity_recognition/__init__.py CHANGED
@@ -1,10 +1,13 @@
-from .presidio_entity_recognition_guardrail import PresidioEntityRecognitionGuardrail
-from .regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
-from .transformers_entity_recognition_guardrail import TransformersEntityRecognitionGuardrail
 from .llm_judge_entity_recognition_guardrail import RestrictedTermsJudge
+from .presidio_entity_recognition_guardrail import PresidioEntityRecognitionGuardrail
+from .regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
+from .transformers_entity_recognition_guardrail import (
+    TransformersEntityRecognitionGuardrail,
+)
+
 __all__ = [
     "PresidioEntityRecognitionGuardrail",
     "RegexEntityRecognitionGuardrail",
     "TransformersEntityRecognitionGuardrail",
-    "RestrictedTermsJudge"
+    "RestrictedTermsJudge",
 ]
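
The trailing comma added to `__all__` is purely stylistic; `__all__` still determines what a star import exposes. A minimal sketch of that behavior, assuming the package is installed:

# Star imports only pick up the names listed in __all__ above.
from guardrails_genie.guardrails.entity_recognition import *

print(PresidioEntityRecognitionGuardrail)
print(RegexEntityRecognitionGuardrail)
print(TransformersEntityRecognitionGuardrail)
print(RestrictedTermsJudge)
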
guardrails_genie/guardrails/entity_recognition/banned_terms_examples/banned_term_examples.py CHANGED
@@ -11,15 +11,22 @@ I think we should implement features similar to Salesforce's Einstein AI
 and Oracle's Cloud Infrastructure. Maybe we could also look at how
 AWS handles their lambda functions.
 """,
-        "custom_terms": ["Salesforce", "Oracle", "AWS", "Einstein AI", "Cloud Infrastructure", "lambda"],
+        "custom_terms": [
+            "Salesforce",
+            "Oracle",
+            "AWS",
+            "Einstein AI",
+            "Cloud Infrastructure",
+            "lambda",
+        ],
         "expected_entities": {
             "Salesforce": ["Salesforce"],
             "Oracle": ["Oracle"],
             "AWS": ["AWS"],
             "Einstein AI": ["Einstein AI"],
             "Cloud Infrastructure": ["Cloud Infrastructure"],
-            "lambda": ["lambda"]
-        }
+            "lambda": ["lambda"],
+        },
     },
     {
         "description": "Inappropriate Language in Support Ticket",
@@ -32,8 +39,8 @@ stupid service? I've wasted so much freaking time on this crap.
             "damn": ["damn"],
             "hell": ["hell"],
             "stupid": ["stupid"],
-            "crap": ["crap"]
-        }
+            "crap": ["crap"],
+        },
     },
     {
         "description": "Confidential Project Names",
@@ -45,9 +52,9 @@ with Project Phoenix team and the Blue Dragon initiative for resource allocation
         "expected_entities": {
             "Project Titan": ["Project Titan"],
             "Project Phoenix": ["Project Phoenix"],
-            "Blue Dragon": ["Blue Dragon"]
-        }
-    }
+            "Blue Dragon": ["Blue Dragon"],
+        },
+    },
 ]

 # Edge cases and special formats
@@ -59,15 +66,22 @@ MSFT's Azure and O365 platform is gaining market share.
 Have you seen what GOOGL/GOOG and FB/META are doing with their AI?
 CRM (Salesforce) and ORCL (Oracle) have interesting features too.
 """,
-        "custom_terms": ["Microsoft", "Google", "Meta", "Facebook", "Salesforce", "Oracle"],
+        "custom_terms": [
+            "Microsoft",
+            "Google",
+            "Meta",
+            "Facebook",
+            "Salesforce",
+            "Oracle",
+        ],
         "expected_entities": {
             "Microsoft": ["MSFT"],
             "Google": ["GOOGL", "GOOG"],
             "Meta": ["META"],
             "Facebook": ["FB"],
             "Salesforce": ["CRM", "Salesforce"],
-            "Oracle": ["ORCL"]
-        }
+            "Oracle": ["ORCL"],
+        },
     },
     {
         "description": "L33t Speak and Intentional Obfuscation",
@@ -76,15 +90,22 @@ S4l3sf0rc3 is better than 0r4cl3!
 M1cr0$oft and G00gl3 are the main competitors.
 Let's check F8book and Met@ too.
 """,
-        "custom_terms": ["Salesforce", "Oracle", "Microsoft", "Google", "Facebook", "Meta"],
+        "custom_terms": [
+            "Salesforce",
+            "Oracle",
+            "Microsoft",
+            "Google",
+            "Facebook",
+            "Meta",
+        ],
         "expected_entities": {
             "Salesforce": ["S4l3sf0rc3"],
             "Oracle": ["0r4cl3"],
             "Microsoft": ["M1cr0$oft"],
             "Google": ["G00gl3"],
             "Facebook": ["F8book"],
-            "Meta": ["Met@"]
-        }
+            "Meta": ["Met@"],
+        },
     },
     {
         "description": "Case Variations and Partial Matches",
@@ -98,8 +119,8 @@ Have you tried micro-soft or Google_Cloud?
             "Microsoft": ["MicroSoft", "micro-soft"],
             "Google": ["google", "Google_Cloud"],
             "Salesforce": ["salesFORCE"],
-            "Oracle": ["ORACLE"]
-        }
+            "Oracle": ["ORACLE"],
+        },
     },
     {
         "description": "Common Misspellings and Typos",
@@ -113,8 +134,8 @@ Salezforce and Oracel need checking too.
             "Microsoft": ["Microsft", "Microsooft"],
             "Google": ["Goggle", "Googel", "Gooogle"],
             "Salesforce": ["Salezforce"],
-            "Oracle": ["Oracel"]
-        }
+            "Oracle": ["Oracel"],
+        },
     },
     {
         "description": "Mixed Variations and Context",
@@ -123,7 +144,15 @@ The M$ cloud competes with AWS (Amazon Web Services).
 FB/Meta's social platform and GOOGL's search dominate.
 SF.com and Oracle-DB are industry standards.
 """,
-        "custom_terms": ["Microsoft", "Amazon Web Services", "Facebook", "Meta", "Google", "Salesforce", "Oracle"],
+        "custom_terms": [
+            "Microsoft",
+            "Amazon Web Services",
+            "Facebook",
+            "Meta",
+            "Google",
+            "Salesforce",
+            "Oracle",
+        ],
         "expected_entities": {
             "Microsoft": ["M$"],
             "Amazon Web Services": ["AWS"],
@@ -131,37 +160,40 @@ SF.com and Oracle-DB are industry standards.
             "Meta": ["Meta"],
             "Google": ["GOOGL"],
             "Salesforce": ["SF.com"],
-            "Oracle": ["Oracle-DB"]
-        }
-    }
+            "Oracle": ["Oracle-DB"],
+        },
+    },
 ]

+
 def validate_entities(detected: dict, expected: dict) -> bool:
     """Compare detected entities with expected entities"""
     if set(detected.keys()) != set(expected.keys()):
         return False
     return all(set(detected[k]) == set(expected[k]) for k in expected.keys())

+
 def run_test_case(guardrail, test_case, test_type="Main"):
     """Run a single test case and print results"""
     print(f"\n{test_type} Test Case: {test_case['description']}")
     print("-" * 50)
-
+
     result = guardrail.guard(
-        test_case['input_text'],
-        custom_terms=test_case['custom_terms']
+        test_case["input_text"], custom_terms=test_case["custom_terms"]
     )
-    expected = test_case['expected_entities']
-
+    expected = test_case["expected_entities"]
+
     # Validate results
     matches = validate_entities(result.detected_entities, expected)
-
+
     print(f"Test Status: {'✓ PASS' if matches else '✗ FAIL'}")
     print(f"Contains Restricted Terms: {result.contains_entities}")
-
+
     if not matches:
         print("\nEntity Comparison:")
-        all_entity_types = set(list(result.detected_entities.keys()) + list(expected.keys()))
+        all_entity_types = set(
+            list(result.detected_entities.keys()) + list(expected.keys())
+        )
         for entity_type in all_entity_types:
             detected = set(result.detected_entities.get(entity_type, []))
             expected_set = set(expected.get(entity_type, []))
@@ -171,8 +203,8 @@ def run_test_case(guardrail, test_case, test_type="Main"):
             if detected != expected_set:
                 print(f"  Missing: {sorted(expected_set - detected)}")
                 print(f"  Extra: {sorted(detected - expected_set)}")
-
+
     if result.anonymized_text:
         print(f"\nAnonymized Text:\n{result.anonymized_text}")
-
+
     return matches
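
Note that validate_entities applies strict matching: the detected and expected entity-type key sets must be identical, and each type's surface forms are compared as sets, so order and duplicates are ignored while any extra or missing mention fails the case. A standalone sketch (the function is copied from above; the example data is made up):

def validate_entities(detected: dict, expected: dict) -> bool:
    """Compare detected entities with expected entities"""
    if set(detected.keys()) != set(expected.keys()):
        return False
    return all(set(detected[k]) == set(expected[k]) for k in expected.keys())


expected = {"Google": ["GOOGL", "GOOG"], "Meta": ["META"]}
print(validate_entities({"Google": ["GOOG", "GOOGL"], "Meta": ["META"]}, expected))  # True: order ignored
print(validate_entities({"Google": ["GOOGL"], "Meta": ["META"]}, expected))  # False: "GOOG" missed
print(validate_entities({"Google": ["GOOGL", "GOOG"]}, expected))  # False: key sets differ
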
guardrails_genie/guardrails/entity_recognition/banned_terms_examples/run_llm_judge.py CHANGED
@@ -1,21 +1,22 @@
-from guardrails_genie.guardrails.entity_recognition.llm_judge_entity_recognition_guardrail import RestrictedTermsJudge
+import weave
+
 from guardrails_genie.guardrails.entity_recognition.banned_terms_examples.banned_term_examples import (
-    RESTRICTED_TERMS_EXAMPLES,
-    EDGE_CASE_EXAMPLES,
-    run_test_case
+    EDGE_CASE_EXAMPLES,
+    RESTRICTED_TERMS_EXAMPLES,
+    run_test_case,
+)
+from guardrails_genie.guardrails.entity_recognition.llm_judge_entity_recognition_guardrail import (
+    RestrictedTermsJudge,
 )
 from guardrails_genie.llm import OpenAIModel
-import weave
+

 def test_restricted_terms_detection():
     """Test restricted terms detection scenarios using predefined test cases"""
     weave.init("guardrails-genie-restricted-terms-llm-judge")
-
+
     # Create the guardrail with OpenAI model
-    llm_judge = RestrictedTermsJudge(
-        should_anonymize=True,
-        llm_model=OpenAIModel()
-    )
+    llm_judge = RestrictedTermsJudge(should_anonymize=True, llm_model=OpenAIModel())

     # Test statistics
     total_tests = len(RESTRICTED_TERMS_EXAMPLES) + len(EDGE_CASE_EXAMPLES)
@@ -43,5 +44,6 @@ def test_restricted_terms_detection():
     print(f"Failed: {total_tests - passed_tests}")
     print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")

+
 if __name__ == "__main__":
     test_restricted_terms_detection()
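
For a single ad-hoc input rather than the whole suite, the judge can also be called directly. A hedged sketch, not part of this commit, assuming OpenAI credentials are configured for OpenAIModel (e.g. via OPENAI_API_KEY):

import weave

from guardrails_genie.guardrails.entity_recognition.llm_judge_entity_recognition_guardrail import (
    RestrictedTermsJudge,
)
from guardrails_genie.llm import OpenAIModel

weave.init("guardrails-genie-restricted-terms-llm-judge")
judge = RestrictedTermsJudge(should_anonymize=True, llm_model=OpenAIModel())

# guard() takes the text plus a custom_terms list, as in run_test_case above.
response = judge.guard(
    "We should benchmark against Salesforce and Oracle.",
    custom_terms=["Salesforce", "Oracle"],
)
print(response.contains_entities)
print(response.detected_entities)
print(response.anonymized_text)
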
guardrails_genie/guardrails/entity_recognition/banned_terms_examples/run_regex_model.py CHANGED
@@ -1,19 +1,22 @@
-from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
+import weave
+
 from guardrails_genie.guardrails.entity_recognition.banned_terms_examples.banned_term_examples import (
-    RESTRICTED_TERMS_EXAMPLES,
-    EDGE_CASE_EXAMPLES,
-    run_test_case
+    EDGE_CASE_EXAMPLES,
+    RESTRICTED_TERMS_EXAMPLES,
+    run_test_case,
+)
+from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import (
+    RegexEntityRecognitionGuardrail,
 )
-import weave
+

 def test_restricted_terms_detection():
     """Test restricted terms detection scenarios using predefined test cases"""
     weave.init("guardrails-genie-restricted-terms-regex-model")
-
+
     # Create the guardrail with anonymization enabled
     regex_guardrail = RegexEntityRecognitionGuardrail(
-        use_defaults=False,  # Don't use default PII patterns
-        should_anonymize=True
+        use_defaults=False, should_anonymize=True  # Don't use default PII patterns
     )

     # Test statistics
@@ -42,5 +45,6 @@ def test_restricted_terms_detection():
     print(f"Failed: {total_tests - passed_tests}")
     print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")

+
 if __name__ == "__main__":
     test_restricted_terms_detection()
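
The same ad-hoc pattern works for the regex guardrail; per the comment above, use_defaults=False limits matching to the supplied terms instead of the built-in PII patterns. A sketch under the same caveats as the judge example:

import weave

from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import (
    RegexEntityRecognitionGuardrail,
)

weave.init("guardrails-genie-restricted-terms-regex-model")

# use_defaults=False: match only the custom terms, not the default PII patterns.
guardrail = RegexEntityRecognitionGuardrail(use_defaults=False, should_anonymize=True)
result = guardrail.guard(
    "Salesforce and Oracle both ship CRM products.",
    custom_terms=["Salesforce", "Oracle"],
)
print(result.contains_entities, result.detected_entities)
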
guardrails_genie/guardrails/entity_recognition/llm_judge_entity_recognition_guardrail.py CHANGED
@@ -1,15 +1,16 @@
 from typing import Dict, List, Optional
+
+import instructor
 import weave
 from pydantic import BaseModel, Field
-from typing_extensions import Annotated

 from ...llm import OpenAIModel
 from ..base import Guardrail
-import instructor


 class TermMatch(BaseModel):
     """Represents a matched term and its variations"""
+
     original_term: str
     matched_text: str
     match_type: str = Field(
@@ -22,19 +23,18 @@

 class RestrictedTermsAnalysis(BaseModel):
     """Analysis result for restricted terms detection"""
+
     contains_restricted_terms: bool = Field(
         description="Whether any restricted terms were detected"
     )
     detected_matches: List[TermMatch] = Field(
         default_factory=list,
-        description="List of detected term matches with their variations"
-    )
-    explanation: str = Field(
-        description="Detailed explanation of the analysis"
+        description="List of detected term matches with their variations",
     )
+    explanation: str = Field(description="Detailed explanation of the analysis")
     anonymized_text: Optional[str] = Field(
         default=None,
-        description="Text with restricted terms replaced with category tags"
+        description="Text with restricted terms replaced with category tags",
     )

     @property
@@ -106,39 +106,57 @@ Return your analysis in the structured format specified by the RestrictedTermsAn
         return user_prompt, system_prompt

     @weave.op()
-    def predict(self, text: str, custom_terms: List[str], **kwargs) -> RestrictedTermsAnalysis:
+    def predict(
+        self, text: str, custom_terms: List[str], **kwargs
+    ) -> RestrictedTermsAnalysis:
         user_prompt, system_prompt = self.format_prompts(text, custom_terms)
-
+
         response = self.llm_model.predict(
             user_prompts=user_prompt,
             system_prompt=system_prompt,
             response_format=RestrictedTermsAnalysis,
             temperature=0.1,  # Lower temperature for more consistent analysis
-            **kwargs
+            **kwargs,
         )
-
+
         return response.choices[0].message.parsed

-    #TODO: Remove default custom_terms
+    # TODO: Remove default custom_terms
     @weave.op()
-    def guard(self, text: str, custom_terms: List[str] = ["Microsoft", "Amazon Web Services", "Facebook", "Meta", "Google", "Salesforce", "Oracle"], aggregate_redaction: bool = True, **kwargs) -> RestrictedTermsRecognitionResponse:
+    def guard(
+        self,
+        text: str,
+        custom_terms: List[str] = [
+            "Microsoft",
+            "Amazon Web Services",
+            "Facebook",
+            "Meta",
+            "Google",
+            "Salesforce",
+            "Oracle",
+        ],
+        aggregate_redaction: bool = True,
+        **kwargs,
+    ) -> RestrictedTermsRecognitionResponse:
         """
         Guard against restricted terms and their variations.
-
+
         Args:
             text: Text to analyze
             custom_terms: List of restricted terms to check for
-
+
         Returns:
             RestrictedTermsRecognitionResponse containing safety assessment and detailed analysis
         """
         analysis = self.predict(text, custom_terms, **kwargs)
-
+
         # Create a summary of findings
         if analysis.contains_restricted_terms:
             summary_parts = ["Restricted terms detected:"]
             for match in analysis.detected_matches:
-                summary_parts.append(f"\n- {match.original_term}: {match.matched_text} ({match.match_type})")
+                summary_parts.append(
+                    f"\n- {match.original_term}: {match.matched_text} ({match.match_type})"
+                )
             summary = "\n".join(summary_parts)
         else:
             summary = "No restricted terms detected."
@@ -148,8 +166,14 @@ Return your analysis in the structured format specified by the RestrictedTermsAn
         if self.should_anonymize and analysis.contains_restricted_terms:
             anonymized_text = text
             for match in analysis.detected_matches:
-                replacement = "[redacted]" if aggregate_redaction else f"[{match.match_type.upper()}]"
-                anonymized_text = anonymized_text.replace(match.matched_text, replacement)
+                replacement = (
+                    "[redacted]"
+                    if aggregate_redaction
+                    else f"[{match.match_type.upper()}]"
+                )
+                anonymized_text = anonymized_text.replace(
+                    match.matched_text, replacement
+                )

         # Convert detected_matches to a dictionary format
         detected_entities = {}
@@ -162,5 +186,5 @@ Return your analysis in the structured format specified by the RestrictedTermsAn
             contains_entities=analysis.contains_restricted_terms,
             detected_entities=detected_entities,
             explanation=summary,
-            anonymized_text=anonymized_text
-        )
+            anonymized_text=anonymized_text,
+        )
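
The `# TODO: Remove default custom_terms` above is worth acting on: a list literal used as a default argument is created once at function-definition time and shared by every call, so any mutation leaks across calls. A hedged sketch of the conventional fix (illustrative only, not what this commit ships):

from typing import List, Optional


def guard(text: str, custom_terms: Optional[List[str]] = None) -> None:
    # None sentinel: build a fresh list per call instead of sharing one
    # module-lifetime default list across all invocations.
    if custom_terms is None:
        custom_terms = ["Microsoft", "Amazon Web Services", "Facebook"]
    print(f"checking {len(custom_terms)} terms against {len(text)} characters")


guard("some prompt")  # uses a fresh default list each call
guard("another prompt", custom_terms=["Salesforce"])  # caller-supplied terms
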
guardrails_genie/guardrails/entity_recognition/pii_examples/pii_benchmark.py CHANGED
@@ -1,10 +1,11 @@
-from datasets import load_dataset
-from typing import Dict, List, Tuple
-import random
-from tqdm import tqdm
 import json
+import random
 from pathlib import Path
+from typing import Dict, List, Tuple
+
 import weave
+from datasets import load_dataset
+from tqdm import tqdm

 # Add this mapping dictionary near the top of the file
 PRESIDIO_TO_TRANSFORMER_MAPPING = {
@@ -32,66 +33,70 @@ PRESIDIO_TO_TRANSFORMER_MAPPING = {
     "CRYPTO": "ACCOUNTNUM",  # Cryptocurrency addresses
     "IBAN_CODE": "ACCOUNTNUM",
     "MEDICAL_LICENSE": "IDCARDNUM",
-    "IN_VEHICLE_REGISTRATION": "IDCARDNUM"
+    "IN_VEHICLE_REGISTRATION": "IDCARDNUM",
 }

-def load_ai4privacy_dataset(num_samples: int = 100, split: str = "validation") -> List[Dict]:
+
+def load_ai4privacy_dataset(
+    num_samples: int = 100, split: str = "validation"
+) -> List[Dict]:
     """
     Load and prepare samples from the ai4privacy dataset.
-
+
     Args:
         num_samples: Number of samples to evaluate
         split: Dataset split to use ("train" or "validation")
-
+
     Returns:
         List of prepared test cases
     """
     # Load the dataset
     dataset = load_dataset("ai4privacy/pii-masking-400k")
-
+
     # Get the specified split
     data_split = dataset[split]
-
+
     # Randomly sample entries if num_samples is less than total
     if num_samples < len(data_split):
         indices = random.sample(range(len(data_split)), num_samples)
         samples = [data_split[i] for i in indices]
     else:
         samples = data_split
-
+
     # Convert to test case format
     test_cases = []
     for sample in samples:
         # Extract entities from privacy_mask
         entities: Dict[str, List[str]] = {}
-        for entity in sample['privacy_mask']:
-            label = entity['label']
-            value = entity['value']
+        for entity in sample["privacy_mask"]:
+            label = entity["label"]
+            value = entity["value"]
             if label not in entities:
                 entities[label] = []
             entities[label].append(value)
-
+
         test_case = {
             "description": f"AI4Privacy Sample (ID: {sample['uid']})",
-            "input_text": sample['source_text'],
+            "input_text": sample["source_text"],
             "expected_entities": entities,
-            "masked_text": sample['masked_text'],
-            "language": sample['language'],
-            "locale": sample['locale']
+            "masked_text": sample["masked_text"],
+            "language": sample["language"],
+            "locale": sample["locale"],
         }
         test_cases.append(test_case)
-
+
     return test_cases

+
 @weave.op()
 def evaluate_model(guardrail, test_cases: List[Dict]) -> Tuple[Dict, List[Dict]]:
     """
     Evaluate a model on the test cases.
-
+
     Args:
         guardrail: Entity recognition guardrail to evaluate
         test_cases: List of test cases
-
+
     Returns:
         Tuple of (metrics dict, detailed results list)
     """
@@ -99,17 +104,17 @@ def evaluate_model(guardrail, test_cases: List[Dict]) -> Tuple[Dict, List[Dict]]
         "total": len(test_cases),
         "passed": 0,
         "failed": 0,
-        "entity_metrics": {}  # Will store precision/recall per entity type
+        "entity_metrics": {},  # Will store precision/recall per entity type
     }
-
+
     detailed_results = []
-
+
     for test_case in tqdm(test_cases, desc="Evaluating samples"):
         # Run detection
-        result = guardrail.guard(test_case['input_text'])
+        result = guardrail.guard(test_case["input_text"])
         detected = result.detected_entities
-        expected = test_case['expected_entities']
-
+        expected = test_case["expected_entities"]
+
         # Map Presidio entities if this is the Presidio guardrail
         if isinstance(guardrail, PresidioEntityRecognitionGuardrail):
             mapped_detected = {}
@@ -120,44 +125,62 @@ def evaluate_model(guardrail, test_cases: List[Dict]) -> Tuple[Dict, List[Dict]]
                     mapped_detected[mapped_type] = []
                 mapped_detected[mapped_type].extend(values)
             detected = mapped_detected
-
+
         # Track entity-level metrics
         all_entity_types = set(list(detected.keys()) + list(expected.keys()))
         entity_results = {}
-
+
         for entity_type in all_entity_types:
             detected_set = set(detected.get(entity_type, []))
             expected_set = set(expected.get(entity_type, []))
-
+
             # Calculate metrics
             true_positives = len(detected_set & expected_set)
             false_positives = len(detected_set - expected_set)
             false_negatives = len(expected_set - detected_set)
-
-            precision = true_positives / (true_positives + false_positives) if (true_positives + false_positives) > 0 else 0
-            recall = true_positives / (true_positives + false_negatives) if (true_positives + false_negatives) > 0 else 0
-            f1 = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
-
+
+            precision = (
+                true_positives / (true_positives + false_positives)
+                if (true_positives + false_positives) > 0
+                else 0
+            )
+            recall = (
+                true_positives / (true_positives + false_negatives)
+                if (true_positives + false_negatives) > 0
+                else 0
+            )
+            f1 = (
+                2 * (precision * recall) / (precision + recall)
+                if (precision + recall) > 0
+                else 0
+            )
+
             entity_results[entity_type] = {
                 "precision": precision,
                 "recall": recall,
                 "f1": f1,
                 "true_positives": true_positives,
                 "false_positives": false_positives,
-                "false_negatives": false_negatives
+                "false_negatives": false_negatives,
             }
-
+
             # Aggregate metrics
             if entity_type not in metrics["entity_metrics"]:
                 metrics["entity_metrics"][entity_type] = {
                     "total_true_positives": 0,
                     "total_false_positives": 0,
-                    "total_false_negatives": 0
+                    "total_false_negatives": 0,
                 }
-            metrics["entity_metrics"][entity_type]["total_true_positives"] += true_positives
-            metrics["entity_metrics"][entity_type]["total_false_positives"] += false_positives
-            metrics["entity_metrics"][entity_type]["total_false_negatives"] += false_negatives
-
+            metrics["entity_metrics"][entity_type][
+                "total_true_positives"
+            ] += true_positives
+            metrics["entity_metrics"][entity_type][
+                "total_false_positives"
+            ] += false_positives
+            metrics["entity_metrics"][entity_type][
+                "total_false_negatives"
+            ] += false_negatives
+
         # Store detailed result
         detailed_result = {
             "id": test_case.get("description", ""),
@@ -167,69 +190,88 @@ def evaluate_model(guardrail, test_cases: List[Dict]) -> Tuple[Dict, List[Dict]]
             "expected_entities": expected,
             "detected_entities": detected,
             "entity_metrics": entity_results,
-            "anonymized_text": result.anonymized_text if result.anonymized_text else None
+            "anonymized_text": (
+                result.anonymized_text if result.anonymized_text else None
+            ),
         }
         detailed_results.append(detailed_result)
-
+
         # Update pass/fail counts
         if all(entity_results[et]["f1"] == 1.0 for et in entity_results):
            metrics["passed"] += 1
         else:
             metrics["failed"] += 1
-
+
     # Calculate final entity metrics and track totals for overall metrics
     total_tp = 0
     total_fp = 0
     total_fn = 0
-
+
     for entity_type, counts in metrics["entity_metrics"].items():
         tp = counts["total_true_positives"]
         fp = counts["total_false_positives"]
         fn = counts["total_false_negatives"]
-
+
         total_tp += tp
         total_fp += fp
         total_fn += fn
-
+
         precision = tp / (tp + fp) if (tp + fp) > 0 else 0
         recall = tp / (tp + fn) if (tp + fn) > 0 else 0
-        f1 = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
-
-        metrics["entity_metrics"][entity_type].update({
-            "precision": precision,
-            "recall": recall,
-            "f1": f1
-        })
-
+        f1 = (
+            2 * (precision * recall) / (precision + recall)
+            if (precision + recall) > 0
+            else 0
+        )
+
+        metrics["entity_metrics"][entity_type].update(
+            {"precision": precision, "recall": recall, "f1": f1}
+        )
+
     # Calculate overall metrics
-    overall_precision = total_tp / (total_tp + total_fp) if (total_tp + total_fp) > 0 else 0
-    overall_recall = total_tp / (total_tp + total_fn) if (total_tp + total_fn) > 0 else 0
-    overall_f1 = 2 * (overall_precision * overall_recall) / (overall_precision + overall_recall) if (overall_precision + overall_recall) > 0 else 0
-
+    overall_precision = (
+        total_tp / (total_tp + total_fp) if (total_tp + total_fp) > 0 else 0
+    )
+    overall_recall = (
+        total_tp / (total_tp + total_fn) if (total_tp + total_fn) > 0 else 0
+    )
+    overall_f1 = (
+        2 * (overall_precision * overall_recall) / (overall_precision + overall_recall)
+        if (overall_precision + overall_recall) > 0
+        else 0
+    )
+
     metrics["overall"] = {
         "precision": overall_precision,
         "recall": overall_recall,
         "f1": overall_f1,
         "total_true_positives": total_tp,
         "total_false_positives": total_fp,
-        "total_false_negatives": total_fn
+        "total_false_negatives": total_fn,
    }
-
+
     return metrics, detailed_results

-def save_results(metrics: Dict, detailed_results: List[Dict], model_name: str, output_dir: str = "evaluation_results"):
+
+def save_results(
+    metrics: Dict,
+    detailed_results: List[Dict],
+    model_name: str,
+    output_dir: str = "evaluation_results",
+):
     """Save evaluation results to files"""
     output_dir = Path(output_dir)
     output_dir.mkdir(exist_ok=True)
-
+
     # Save metrics summary
     with open(output_dir / f"{model_name}_metrics.json", "w") as f:
         json.dump(metrics, f, indent=2)
-
+
     # Save detailed results
     with open(output_dir / f"{model_name}_detailed_results.json", "w") as f:
         json.dump(detailed_results, f, indent=2)

+
 def print_metrics_summary(metrics: Dict):
     """Print a summary of the evaluation metrics"""
     print("\nEvaluation Summary")
@@ -238,7 +280,7 @@ def print_metrics_summary(metrics: Dict):
     print(f"Passed: {metrics['passed']}")
     print(f"Failed: {metrics['failed']}")
     print(f"Success Rate: {(metrics['passed']/metrics['total'])*100:.1f}%")
-
+
     # Print overall metrics
     print("\nOverall Metrics:")
     print("-" * 80)
@@ -247,40 +289,56 @@ def print_metrics_summary(metrics: Dict):
     print(f"{'Precision':<20} {metrics['overall']['precision']:>10.2f}")
     print(f"{'Recall':<20} {metrics['overall']['recall']:>10.2f}")
     print(f"{'F1':<20} {metrics['overall']['f1']:>10.2f}")
-
+
     print("\nEntity-level Metrics:")
     print("-" * 80)
     print(f"{'Entity Type':<20} {'Precision':>10} {'Recall':>10} {'F1':>10}")
     print("-" * 80)
     for entity_type, entity_metrics in metrics["entity_metrics"].items():
-        print(f"{entity_type:<20} {entity_metrics['precision']:>10.2f} {entity_metrics['recall']:>10.2f} {entity_metrics['f1']:>10.2f}")
+        print(
+            f"{entity_type:<20} {entity_metrics['precision']:>10.2f} {entity_metrics['recall']:>10.2f} {entity_metrics['f1']:>10.2f}"
+        )
+

 def main():
     """Main evaluation function"""
     weave.init("guardrails-genie-pii-evaluation-demo")
-
+
     # Load test cases
     test_cases = load_ai4privacy_dataset(num_samples=100)
-
+
     # Initialize models to evaluate
     models = {
-        "regex": RegexEntityRecognitionGuardrail(should_anonymize=True, show_available_entities=True),
-        "presidio": PresidioEntityRecognitionGuardrail(should_anonymize=True, show_available_entities=True),
-        "transformers": TransformersEntityRecognitionGuardrail(should_anonymize=True, show_available_entities=True)
+        "regex": RegexEntityRecognitionGuardrail(
+            should_anonymize=True, show_available_entities=True
+        ),
+        "presidio": PresidioEntityRecognitionGuardrail(
+            should_anonymize=True, show_available_entities=True
+        ),
+        "transformers": TransformersEntityRecognitionGuardrail(
+            should_anonymize=True, show_available_entities=True
+        ),
     }
-
+
     # Evaluate each model
     for model_name, guardrail in models.items():
         print(f"\nEvaluating {model_name} model...")
         metrics, detailed_results = evaluate_model(guardrail, test_cases)
-
+
         # Print and save results
         print_metrics_summary(metrics)
         save_results(metrics, detailed_results, model_name)

+
 if __name__ == "__main__":
-    from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
-    from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import PresidioEntityRecognitionGuardrail
-    from guardrails_genie.guardrails.entity_recognition.transformers_entity_recognition_guardrail import TransformersEntityRecognitionGuardrail
-
-    main()
+    from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import (
+        PresidioEntityRecognitionGuardrail,
+    )
+    from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import (
+        RegexEntityRecognitionGuardrail,
+    )
+    from guardrails_genie.guardrails.entity_recognition.transformers_entity_recognition_guardrail import (
+        TransformersEntityRecognitionGuardrail,
+    )
+
+    main()
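
The guarded divisions in evaluate_model are the standard per-entity precision/recall/F1; a small worked example with made-up detection sets:

# Worked example of the metric arithmetic in evaluate_model (invented data).
detected_set = {"MSFT", "M$", "Windows"}  # surface forms the guardrail found
expected_set = {"MSFT", "M$"}  # ground-truth surface forms

true_positives = len(detected_set & expected_set)  # 2
false_positives = len(detected_set - expected_set)  # 1 ("Windows")
false_negatives = len(expected_set - detected_set)  # 0

precision = true_positives / (true_positives + false_positives)  # 2/3
recall = true_positives / (true_positives + false_negatives)  # 2/2 = 1.0
f1 = 2 * (precision * recall) / (precision + recall)  # 0.80
print(f"P={precision:.2f} R={recall:.2f} F1={f1:.2f}")  # P=0.67 R=1.00 F1=0.80
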
guardrails_genie/guardrails/entity_recognition/pii_examples/pii_benchmark_weave.py CHANGED
@@ -1,13 +1,13 @@
-from datasets import load_dataset
-from typing import Dict, List, Tuple, Optional
-import random
-from tqdm import tqdm
+import asyncio
 import json
+import random
 from pathlib import Path
+from typing import Dict, List, Optional
+
 import weave
-from weave.scorers import Scorer
+from datasets import load_dataset
 from weave import Evaluation
-import asyncio
+from weave.scorers import Scorer

 # Add this mapping dictionary near the top of the file
 PRESIDIO_TO_TRANSFORMER_MAPPING = {
@@ -35,26 +35,29 @@ PRESIDIO_TO_TRANSFORMER_MAPPING = {
     "CRYPTO": "ACCOUNTNUM",  # Cryptocurrency addresses
     "IBAN_CODE": "ACCOUNTNUM",
     "MEDICAL_LICENSE": "IDCARDNUM",
-    "IN_VEHICLE_REGISTRATION": "IDCARDNUM"
+    "IN_VEHICLE_REGISTRATION": "IDCARDNUM",
 }

+
 class EntityRecognitionScorer(Scorer):
     """Scorer for evaluating entity recognition performance"""
-
+
     @weave.op()
-    async def score(self, model_output: Optional[dict], input_text: str, expected_entities: Dict) -> Dict:
+    async def score(
+        self, model_output: Optional[dict], input_text: str, expected_entities: Dict
+    ) -> Dict:
         """Score entity recognition results"""
         if not model_output:
             return {"f1": 0.0}
-
+
         # Convert Pydantic model to dict if necessary
         if hasattr(model_output, "model_dump"):
             model_output = model_output.model_dump()
         elif hasattr(model_output, "dict"):
             model_output = model_output.dict()
-
+
         detected = model_output.get("detected_entities", {})
-
+
         # Map Presidio entities if needed
         if model_output.get("model_type") == "presidio":
             mapped_detected = {}
@@ -65,191 +68,234 @@ class EntityRecognitionScorer(Scorer):
                     mapped_detected[mapped_type] = []
                 mapped_detected[mapped_type].extend(values)
             detected = mapped_detected
-
+
         # Track entity-level metrics
         all_entity_types = set(list(detected.keys()) + list(expected_entities.keys()))
         entity_metrics = {}
-
+
         for entity_type in all_entity_types:
             detected_set = set(detected.get(entity_type, []))
             expected_set = set(expected_entities.get(entity_type, []))
-
+
             # Calculate metrics
             true_positives = len(detected_set & expected_set)
             false_positives = len(detected_set - expected_set)
             false_negatives = len(expected_set - detected_set)
-
+
             if entity_type not in entity_metrics:
                 entity_metrics[entity_type] = {
                     "total_true_positives": 0,
                     "total_false_positives": 0,
-                    "total_false_negatives": 0
+                    "total_false_negatives": 0,
                 }
-
+
             entity_metrics[entity_type]["total_true_positives"] += true_positives
             entity_metrics[entity_type]["total_false_positives"] += false_positives
             entity_metrics[entity_type]["total_false_negatives"] += false_negatives
-
+
             # Calculate per-entity metrics
-            precision = true_positives / (true_positives + false_positives) if (true_positives + false_positives) > 0 else 0
-            recall = true_positives / (true_positives + false_negatives) if (true_positives + false_negatives) > 0 else 0
-            f1 = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
-
-            entity_metrics[entity_type].update({
-                "precision": precision,
-                "recall": recall,
-                "f1": f1
-            })
-
+            precision = (
+                true_positives / (true_positives + false_positives)
+                if (true_positives + false_positives) > 0
+                else 0
+            )
+            recall = (
+                true_positives / (true_positives + false_negatives)
+                if (true_positives + false_negatives) > 0
+                else 0
+            )
+            f1 = (
+                2 * (precision * recall) / (precision + recall)
+                if (precision + recall) > 0
+                else 0
+            )
+
+            entity_metrics[entity_type].update(
+                {"precision": precision, "recall": recall, "f1": f1}
+            )
+
         # Calculate overall metrics
-        total_tp = sum(metrics["total_true_positives"] for metrics in entity_metrics.values())
-        total_fp = sum(metrics["total_false_positives"] for metrics in entity_metrics.values())
-        total_fn = sum(metrics["total_false_negatives"] for metrics in entity_metrics.values())
-
-        overall_precision = total_tp / (total_tp + total_fp) if (total_tp + total_fp) > 0 else 0
-        overall_recall = total_tp / (total_tp + total_fn) if (total_tp + total_fn) > 0 else 0
-        overall_f1 = 2 * (overall_precision * overall_recall) / (overall_precision + overall_recall) if (overall_precision + overall_recall) > 0 else 0
-
+        total_tp = sum(
+            metrics["total_true_positives"] for metrics in entity_metrics.values()
+        )
+        total_fp = sum(
+            metrics["total_false_positives"] for metrics in entity_metrics.values()
+        )
+        total_fn = sum(
+            metrics["total_false_negatives"] for metrics in entity_metrics.values()
+        )
+
+        overall_precision = (
+            total_tp / (total_tp + total_fp) if (total_tp + total_fp) > 0 else 0
+        )
+        overall_recall = (
+            total_tp / (total_tp + total_fn) if (total_tp + total_fn) > 0 else 0
+        )
+        overall_f1 = (
+            2
+            * (overall_precision * overall_recall)
+            / (overall_precision + overall_recall)
+            if (overall_precision + overall_recall) > 0
+            else 0
+        )
+
         entity_metrics["overall"] = {
             "precision": overall_precision,
             "recall": overall_recall,
             "f1": overall_f1,
             "total_true_positives": total_tp,
             "total_false_positives": total_fp,
-            "total_false_negatives": total_fn
+            "total_false_negatives": total_fn,
         }
-
+
         return entity_metrics

-def load_ai4privacy_dataset(num_samples: int = 100, split: str = "validation") -> List[Dict]:
+
+def load_ai4privacy_dataset(
+    num_samples: int = 100, split: str = "validation"
+) -> List[Dict]:
     """
     Load and prepare samples from the ai4privacy dataset.
-
+
     Args:
         num_samples: Number of samples to evaluate
         split: Dataset split to use ("train" or "validation")
-
+
     Returns:
         List of prepared test cases
     """
     # Load the dataset
     dataset = load_dataset("ai4privacy/pii-masking-400k")
-
+
     # Get the specified split
     data_split = dataset[split]
-
+
     # Randomly sample entries if num_samples is less than total
     if num_samples < len(data_split):
         indices = random.sample(range(len(data_split)), num_samples)
         samples = [data_split[i] for i in indices]
     else:
         samples = data_split
-
+
     # Convert to test case format
     test_cases = []
     for sample in samples:
         # Extract entities from privacy_mask
         entities: Dict[str, List[str]] = {}
-        for entity in sample['privacy_mask']:
-            label = entity['label']
-            value = entity['value']
+        for entity in sample["privacy_mask"]:
+            label = entity["label"]
+            value = entity["value"]
             if label not in entities:
                 entities[label] = []
             entities[label].append(value)
-
+
         test_case = {
             "description": f"AI4Privacy Sample (ID: {sample['uid']})",
-            "input_text": sample['source_text'],
+            "input_text": sample["source_text"],
             "expected_entities": entities,
-            "masked_text": sample['masked_text'],
-            "language": sample['language'],
-            "locale": sample['locale']
+            "masked_text": sample["masked_text"],
+            "language": sample["language"],
+            "locale": sample["locale"],
        }
         test_cases.append(test_case)
-
+
     return test_cases

-def save_results(weave_results: Dict, model_name: str, output_dir: str = "evaluation_results"):
     """Save evaluation results to files"""
     output_dir = Path(output_dir)
     output_dir.mkdir(exist_ok=True)
-
     # Extract and process results
     scorer_results = weave_results.get("EntityRecognitionScorer", [])
     if not scorer_results or all(r is None for r in scorer_results):
         print(f"No valid results to save for {model_name}")
         return
-
     # Calculate summary metrics
     total_samples = len(scorer_results)
     passed = sum(1 for r in scorer_results if r is not None and not isinstance(r, str))
-
     # Aggregate entity-level metrics
     entity_metrics = {}
     for result in scorer_results:
         try:
             if isinstance(result, str) or not result:
                 continue
-
             for entity_type, metrics in result.items():
                 if entity_type not in entity_metrics:
                     entity_metrics[entity_type] = {
                         "precision": [],
                         "recall": [],
-                        "f1": []
                     }
                 entity_metrics[entity_type]["precision"].append(metrics["precision"])
                 entity_metrics[entity_type]["recall"].append(metrics["recall"])
                 entity_metrics[entity_type]["f1"].append(metrics["f1"])
         except (AttributeError, TypeError, KeyError):
             continue
-
     # Calculate averages
     summary_metrics = {
         "total": total_samples,
         "passed": passed,
         "failed": total_samples - passed,
-        "success_rate": (passed/total_samples) if total_samples > 0 else 0,
         "entity_metrics": {
             entity_type: {
-                "precision": sum(metrics["precision"]) / len(metrics["precision"]) if metrics["precision"] else 0,
-                "recall": sum(metrics["recall"]) / len(metrics["recall"]) if metrics["recall"] else 0,
-                "f1": sum(metrics["f1"]) / len(metrics["f1"]) if metrics["f1"] else 0
             }
             for entity_type, metrics in entity_metrics.items()
-        }
     }
-
     # Save files
     with open(output_dir / f"{model_name}_metrics.json", "w") as f:
         json.dump(summary_metrics, f, indent=2)
-
     # Save detailed results, filtering out string results
-    detailed_results = [r for r in scorer_results if not isinstance(r, str) and r is not None]
     with open(output_dir / f"{model_name}_detailed_results.json", "w") as f:
         json.dump(detailed_results, f, indent=2)

 def print_metrics_summary(weave_results: Dict):
     """Print a summary of the evaluation metrics"""
     print("\nEvaluation Summary")
     print("=" * 80)
-
     # Extract results from Weave's evaluation format
     scorer_results = weave_results.get("EntityRecognitionScorer", {})
     if not scorer_results:
         print("No valid results available")
         return
-
     # Calculate overall metrics
     total_samples = int(weave_results.get("model_latency", {}).get("count", 0))
     passed = total_samples  # Since we have results, all samples passed
     failed = 0
-
     print(f"Total Samples: {total_samples}")
     print(f"Passed: {passed}")
     print(f"Failed: {failed}")
     print(f"Success Rate: {(passed/total_samples)*100:.2f}%")
-
     # Print overall metrics
     if "overall" in scorer_results:
         overall = scorer_results["overall"]
@@ -260,63 +306,68 @@ def print_metrics_summary(weave_results: Dict):
         print(f"{'Precision':<20} {overall['precision']['mean']:>10.2f}")
         print(f"{'Recall':<20} {overall['recall']['mean']:>10.2f}")
         print(f"{'F1':<20} {overall['f1']['mean']:>10.2f}")
-
     # Print entity-level metrics
     print("\nEntity-Level Metrics:")
     print("-" * 80)
     print(f"{'Entity Type':<20} {'Precision':>10} {'Recall':>10} {'F1':>10}")
     print("-" * 80)
-
     for entity_type, metrics in scorer_results.items():
         if entity_type == "overall":
             continue
-
         precision = metrics.get("precision", {}).get("mean", 0)
         recall = metrics.get("recall", {}).get("mean", 0)
         f1 = metrics.get("f1", {}).get("mean", 0)
-
         print(f"{entity_type:<20} {precision:>10.2f} {recall:>10.2f} {f1:>10.2f}")

 def preprocess_model_input(example: Dict) -> Dict:
     """Preprocess dataset example to match model input format."""
     return {
         "prompt": example["input_text"],
-        "model_type": example.get("model_type", "unknown")  # Add model type for Presidio mapping
     }

 def main():
     """Main evaluation function"""
     weave.init("guardrails-genie-pii-evaluation")
-
     # Load test cases
     test_cases = load_ai4privacy_dataset(num_samples=100)
-
     # Add model type to test cases for Presidio mapping
     models = {
         # "regex": RegexEntityRecognitionGuardrail(should_anonymize=True),
         "presidio": PresidioEntityRecognitionGuardrail(should_anonymize=True),
         # "transformers": TransformersEntityRecognitionGuardrail(should_anonymize=True)
     }
-
     scorer = EntityRecognitionScorer()
-
     # Evaluate each model
     for model_name, guardrail in models.items():
         print(f"\nEvaluating {model_name} model...")
         # Add model type to test cases
         model_test_cases = [{**case, "model_type": model_name} for case in test_cases]
-
         evaluation = Evaluation(
             dataset=model_test_cases,
             scorers=[scorer],
-            preprocess_model_input=preprocess_model_input
         )
-
         results = asyncio.run(evaluation.evaluate(guardrail))

 if __name__ == "__main__":
-    from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
-    from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import PresidioEntityRecognitionGuardrail
-    from guardrails_genie.guardrails.entity_recognition.transformers_entity_recognition_guardrail import TransformersEntityRecognitionGuardrail
-
-    main()
189
  entities[label] = []
190
  entities[label].append(value)
191
+
192
  test_case = {
193
  "description": f"AI4Privacy Sample (ID: {sample['uid']})",
194
+ "input_text": sample["source_text"],
195
  "expected_entities": entities,
196
+ "masked_text": sample["masked_text"],
197
+ "language": sample["language"],
198
+ "locale": sample["locale"],
199
  }
200
  test_cases.append(test_case)
201
+
202
  return test_cases
203
 
204
+
205
+ def save_results(
206
+ weave_results: Dict, model_name: str, output_dir: str = "evaluation_results"
207
+ ):
208
  """Save evaluation results to files"""
209
  output_dir = Path(output_dir)
210
  output_dir.mkdir(exist_ok=True)
211
+
212
  # Extract and process results
213
  scorer_results = weave_results.get("EntityRecognitionScorer", [])
214
  if not scorer_results or all(r is None for r in scorer_results):
215
  print(f"No valid results to save for {model_name}")
216
  return
217
+
218
  # Calculate summary metrics
219
  total_samples = len(scorer_results)
220
  passed = sum(1 for r in scorer_results if r is not None and not isinstance(r, str))
221
+
222
  # Aggregate entity-level metrics
223
  entity_metrics = {}
224
  for result in scorer_results:
225
  try:
226
  if isinstance(result, str) or not result:
227
  continue
228
+
229
  for entity_type, metrics in result.items():
230
  if entity_type not in entity_metrics:
231
  entity_metrics[entity_type] = {
232
  "precision": [],
233
  "recall": [],
234
+ "f1": [],
235
  }
236
  entity_metrics[entity_type]["precision"].append(metrics["precision"])
237
  entity_metrics[entity_type]["recall"].append(metrics["recall"])
238
  entity_metrics[entity_type]["f1"].append(metrics["f1"])
239
  except (AttributeError, TypeError, KeyError):
240
  continue
241
+
242
  # Calculate averages
243
  summary_metrics = {
244
  "total": total_samples,
245
  "passed": passed,
246
  "failed": total_samples - passed,
247
+ "success_rate": (passed / total_samples) if total_samples > 0 else 0,
248
  "entity_metrics": {
249
  entity_type: {
250
+ "precision": (
251
+ sum(metrics["precision"]) / len(metrics["precision"])
252
+ if metrics["precision"]
253
+ else 0
254
+ ),
255
+ "recall": (
256
+ sum(metrics["recall"]) / len(metrics["recall"])
257
+ if metrics["recall"]
258
+ else 0
259
+ ),
260
+ "f1": sum(metrics["f1"]) / len(metrics["f1"]) if metrics["f1"] else 0,
261
  }
262
  for entity_type, metrics in entity_metrics.items()
263
+ },
264
  }
265
+
266
  # Save files
267
  with open(output_dir / f"{model_name}_metrics.json", "w") as f:
268
  json.dump(summary_metrics, f, indent=2)
269
+
270
  # Save detailed results, filtering out string results
271
+ detailed_results = [
272
+ r for r in scorer_results if not isinstance(r, str) and r is not None
273
+ ]
274
  with open(output_dir / f"{model_name}_detailed_results.json", "w") as f:
275
  json.dump(detailed_results, f, indent=2)
276
 
277
+
278
  def print_metrics_summary(weave_results: Dict):
279
  """Print a summary of the evaluation metrics"""
280
  print("\nEvaluation Summary")
281
  print("=" * 80)
282
+
283
  # Extract results from Weave's evaluation format
284
  scorer_results = weave_results.get("EntityRecognitionScorer", {})
285
  if not scorer_results:
286
  print("No valid results available")
287
  return
288
+
289
  # Calculate overall metrics
290
  total_samples = int(weave_results.get("model_latency", {}).get("count", 0))
291
  passed = total_samples # Since we have results, all samples passed
292
  failed = 0
293
+
294
  print(f"Total Samples: {total_samples}")
295
  print(f"Passed: {passed}")
296
  print(f"Failed: {failed}")
297
  print(f"Success Rate: {(passed/total_samples)*100:.2f}%")
298
+
299
  # Print overall metrics
300
  if "overall" in scorer_results:
301
  overall = scorer_results["overall"]
 
306
  print(f"{'Precision':<20} {overall['precision']['mean']:>10.2f}")
307
  print(f"{'Recall':<20} {overall['recall']['mean']:>10.2f}")
308
  print(f"{'F1':<20} {overall['f1']['mean']:>10.2f}")
309
+
310
  # Print entity-level metrics
311
  print("\nEntity-Level Metrics:")
312
  print("-" * 80)
313
  print(f"{'Entity Type':<20} {'Precision':>10} {'Recall':>10} {'F1':>10}")
314
  print("-" * 80)
315
+
316
  for entity_type, metrics in scorer_results.items():
317
  if entity_type == "overall":
318
  continue
319
+
320
  precision = metrics.get("precision", {}).get("mean", 0)
321
  recall = metrics.get("recall", {}).get("mean", 0)
322
  f1 = metrics.get("f1", {}).get("mean", 0)
323
+
324
  print(f"{entity_type:<20} {precision:>10.2f} {recall:>10.2f} {f1:>10.2f}")
325
 
326
+
327
  def preprocess_model_input(example: Dict) -> Dict:
328
  """Preprocess dataset example to match model input format."""
329
  return {
330
  "prompt": example["input_text"],
331
+ "model_type": example.get(
332
+ "model_type", "unknown"
333
+ ), # Add model type for Presidio mapping
334
  }
335
 
336
+
337
  def main():
338
  """Main evaluation function"""
339
  weave.init("guardrails-genie-pii-evaluation")
340
+
341
  # Load test cases
342
  test_cases = load_ai4privacy_dataset(num_samples=100)
343
+
344
  # Models to evaluate; model_type is attached to each test case below for Presidio mapping
345
  models = {
346
  # "regex": RegexEntityRecognitionGuardrail(should_anonymize=True),
347
  "presidio": PresidioEntityRecognitionGuardrail(should_anonymize=True),
348
  # "transformers": TransformersEntityRecognitionGuardrail(should_anonymize=True)
349
  }
350
+
351
  scorer = EntityRecognitionScorer()
352
+
353
  # Evaluate each model
354
  for model_name, guardrail in models.items():
355
  print(f"\nEvaluating {model_name} model...")
356
  # Add model type to test cases
357
  model_test_cases = [{**case, "model_type": model_name} for case in test_cases]
358
+
359
  evaluation = Evaluation(
360
  dataset=model_test_cases,
361
  scorers=[scorer],
362
+ preprocess_model_input=preprocess_model_input,
363
  )
364
+
365
  results = asyncio.run(evaluation.evaluate(guardrail))
366
 
367
+
368
  if __name__ == "__main__":
369
+ from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import (
370
+ PresidioEntityRecognitionGuardrail,
371
+ )
372
+
373
+ main()
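
The per-entity precision/recall/F1 computed by EntityRecognitionScorer above reduces to set arithmetic over detected vs. expected values. A minimal standalone sketch of that arithmetic, with toy detected/expected dicts (illustrative values only, not dataset output):

# Toy inputs, for illustration only
detected = {"EMAIL": ["jane@example.com"], "GIVENNAME": ["John", "Jane"]}
expected = {"EMAIL": ["jane@example.com"], "GIVENNAME": ["John"], "SURNAME": ["Doe"]}

for entity_type in set(detected) | set(expected):
    detected_set = set(detected.get(entity_type, []))
    expected_set = set(expected.get(entity_type, []))
    tp = len(detected_set & expected_set)  # true positives
    fp = len(detected_set - expected_set)  # false positives
    fn = len(expected_set - detected_set)  # false negatives
    precision = tp / (tp + fp) if (tp + fp) > 0 else 0
    recall = tp / (tp + fn) if (tp + fn) > 0 else 0
    f1 = 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0
    print(f"{entity_type}: P={precision:.2f} R={recall:.2f} F1={f1:.2f}")
# GIVENNAME: P=0.50 R=1.00 F1=0.67; SURNAME: all 0.00; EMAIL: all 1.00

The "overall" row in the scorer aggregates the raw counts before dividing (micro-averaging), so frequent entity types dominate the overall F1.
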
guardrails_genie/guardrails/entity_recognition/pii_examples/pii_test_examples.py CHANGED
@@ -18,8 +18,8 @@ Emergency Contact: Mary Johnson (Tel: 098-765-4321)
18
  "SURNAME": ["Smith", "Johnson"],
19
  "EMAIL": ["[email protected]"],
20
  "PHONE_NUMBER": ["123-456-7890", "098-765-4321"],
21
- "SOCIALNUM": ["123-45-6789"]
22
- }
23
  },
24
  {
25
  "description": "Meeting Notes with Attendees",
@@ -39,8 +39,8 @@ Action Items:
39
  "GIVENNAME": ["Sarah", "Robert", "Tom", "Bob"],
40
  "SURNAME": ["Williams", "Brown", "Wilson"],
41
42
- "PHONE_NUMBER": ["555-0123-4567", "777-888-9999"]
43
- }
44
  },
45
  {
46
  "description": "Medical Record",
@@ -57,8 +57,8 @@ Emergency Contact: Michael Thompson (555-123-4567)
57
  "GIVENNAME": ["Emma", "James", "Michael"],
58
  "SURNAME": ["Thompson", "Wilson", "Thompson"],
59
  "EMAIL": ["[email protected]"],
60
- "PHONE_NUMBER": ["555-123-4567"]
61
- }
62
  },
63
  {
64
  "description": "No PII Content",
@@ -68,7 +68,7 @@ Project Status Update:
68
  - Budget is within limits
69
  - Next review scheduled for next week
70
  """,
71
- "expected_entities": {}
72
  },
73
  {
74
  "description": "Mixed Format Phone Numbers",
@@ -84,10 +84,10 @@ Emergency: 555 444 3333
84
  "(555) 123-4567",
85
  "555.987.6543",
86
  "+1-555-321-7890",
87
- "555 444 3333"
88
  ]
89
- }
90
- }
91
  ]
92
 
93
  # Additional examples can be added to test specific edge cases or formats
@@ -103,37 +103,41 @@ [email protected]
103
  "EMAIL": [
104
105
106
107
  ],
108
  "GIVENNAME": ["John", "Jane", "Bob"],
109
- "SURNAME": ["Doe", "Smith", "Jones"]
110
- }
111
  }
112
  ]
113
 
 
114
  def validate_entities(detected: dict, expected: dict) -> bool:
115
  """Compare detected entities with expected entities"""
116
  if set(detected.keys()) != set(expected.keys()):
117
  return False
118
  return all(set(detected[k]) == set(expected[k]) for k in expected.keys())
119
 
 
120
  def run_test_case(guardrail, test_case, test_type="Main"):
121
  """Run a single test case and print results"""
122
  print(f"\n{test_type} Test Case: {test_case['description']}")
123
  print("-" * 50)
124
-
125
- result = guardrail.guard(test_case['input_text'])
126
- expected = test_case['expected_entities']
127
-
128
  # Validate results
129
  matches = validate_entities(result.detected_entities, expected)
130
-
131
  print(f"Test Status: {'✓ PASS' if matches else '✗ FAIL'}")
132
  print(f"Contains PII: {result.contains_entities}")
133
-
134
  if not matches:
135
  print("\nEntity Comparison:")
136
- all_entity_types = set(list(result.detected_entities.keys()) + list(expected.keys()))
 
 
137
  for entity_type in all_entity_types:
138
  detected = set(result.detected_entities.get(entity_type, []))
139
  expected_set = set(expected.get(entity_type, []))
@@ -143,8 +147,8 @@ def run_test_case(guardrail, test_case, test_type="Main"):
143
  if detected != expected_set:
144
  print(f" Missing: {sorted(expected_set - detected)}")
145
  print(f" Extra: {sorted(detected - expected_set)}")
146
-
147
  if result.anonymized_text:
148
  print(f"\nAnonymized Text:\n{result.anonymized_text}")
149
-
150
- return matches
 
18
  "SURNAME": ["Smith", "Johnson"],
19
  "EMAIL": ["[email protected]"],
20
  "PHONE_NUMBER": ["123-456-7890", "098-765-4321"],
21
+ "SOCIALNUM": ["123-45-6789"],
22
+ },
23
  },
24
  {
25
  "description": "Meeting Notes with Attendees",
 
39
  "GIVENNAME": ["Sarah", "Robert", "Tom", "Bob"],
40
  "SURNAME": ["Williams", "Brown", "Wilson"],
41
42
+ "PHONE_NUMBER": ["555-0123-4567", "777-888-9999"],
43
+ },
44
  },
45
  {
46
  "description": "Medical Record",
 
57
  "GIVENNAME": ["Emma", "James", "Michael"],
58
  "SURNAME": ["Thompson", "Wilson", "Thompson"],
59
  "EMAIL": ["[email protected]"],
60
+ "PHONE_NUMBER": ["555-123-4567"],
61
+ },
62
  },
63
  {
64
  "description": "No PII Content",
 
68
  - Budget is within limits
69
  - Next review scheduled for next week
70
  """,
71
+ "expected_entities": {},
72
  },
73
  {
74
  "description": "Mixed Format Phone Numbers",
 
84
  "(555) 123-4567",
85
  "555.987.6543",
86
  "+1-555-321-7890",
87
+ "555 444 3333",
88
  ]
89
+ },
90
+ },
91
  ]
92
 
93
  # Additional examples can be added to test specific edge cases or formats
 
103
  "EMAIL": [
104
105
106
107
  ],
108
  "GIVENNAME": ["John", "Jane", "Bob"],
109
+ "SURNAME": ["Doe", "Smith", "Jones"],
110
+ },
111
  }
112
  ]
113
 
114
+
115
  def validate_entities(detected: dict, expected: dict) -> bool:
116
  """Compare detected entities with expected entities"""
117
  if set(detected.keys()) != set(expected.keys()):
118
  return False
119
  return all(set(detected[k]) == set(expected[k]) for k in expected.keys())
120
 
121
+
122
  def run_test_case(guardrail, test_case, test_type="Main"):
123
  """Run a single test case and print results"""
124
  print(f"\n{test_type} Test Case: {test_case['description']}")
125
  print("-" * 50)
126
+
127
+ result = guardrail.guard(test_case["input_text"])
128
+ expected = test_case["expected_entities"]
129
+
130
  # Validate results
131
  matches = validate_entities(result.detected_entities, expected)
132
+
133
  print(f"Test Status: {'✓ PASS' if matches else '✗ FAIL'}")
134
  print(f"Contains PII: {result.contains_entities}")
135
+
136
  if not matches:
137
  print("\nEntity Comparison:")
138
+ all_entity_types = set(
139
+ list(result.detected_entities.keys()) + list(expected.keys())
140
+ )
141
  for entity_type in all_entity_types:
142
  detected = set(result.detected_entities.get(entity_type, []))
143
  expected_set = set(expected.get(entity_type, []))
 
147
  if detected != expected_set:
148
  print(f" Missing: {sorted(expected_set - detected)}")
149
  print(f" Extra: {sorted(detected - expected_set)}")
150
+
151
  if result.anonymized_text:
152
  print(f"\nAnonymized Text:\n{result.anonymized_text}")
153
+
154
+ return matches
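
These helpers drive the run_*_model.py scripts that follow. A minimal usage sketch, assuming any of the entity-recognition guardrails with a guard() method (the regex guardrail here is just an example choice):

from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import (
    RegexEntityRecognitionGuardrail,
)

guardrail = RegexEntityRecognitionGuardrail(should_anonymize=True)
# run_test_case returns True on a pass, so the bools sum to a pass count
passed = sum(run_test_case(guardrail, case) for case in PII_TEST_EXAMPLES)
print(f"{passed}/{len(PII_TEST_EXAMPLES)} main test cases passed")
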
guardrails_genie/guardrails/entity_recognition/pii_examples/run_presidio_model.py CHANGED
@@ -1,15 +1,22 @@
1
- from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import PresidioEntityRecognitionGuardrail
2
- from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import PII_TEST_EXAMPLES, EDGE_CASE_EXAMPLES, run_test_case, validate_entities
3
  import weave
4

5
  def test_pii_detection():
6
  """Test PII detection scenarios using predefined test cases"""
7
  weave.init("guardrails-genie-pii-presidio-model")
8
-
9
  # Create the guardrail with default entities and anonymization enabled
10
  pii_guardrail = PresidioEntityRecognitionGuardrail(
11
- should_anonymize=True,
12
- show_available_entities=True
13
  )
14
 
15
  # Test statistics
@@ -38,5 +45,6 @@ def test_pii_detection():
38
  print(f"Failed: {total_tests - passed_tests}")
39
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
40
 
 
41
  if __name__ == "__main__":
42
  test_pii_detection()
 
 
 
1
  import weave
2
 
3
+ from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import (
4
+ EDGE_CASE_EXAMPLES,
5
+ PII_TEST_EXAMPLES,
6
+ run_test_case,
7
+ )
8
+ from guardrails_genie.guardrails.entity_recognition.presidio_entity_recognition_guardrail import (
9
+ PresidioEntityRecognitionGuardrail,
10
+ )
11
+
12
+
13
  def test_pii_detection():
14
  """Test PII detection scenarios using predefined test cases"""
15
  weave.init("guardrails-genie-pii-presidio-model")
16
+
17
  # Create the guardrail with default entities and anonymization enabled
18
  pii_guardrail = PresidioEntityRecognitionGuardrail(
19
+ should_anonymize=True, show_available_entities=True
 
20
  )
21
 
22
  # Test statistics
 
45
  print(f"Failed: {total_tests - passed_tests}")
46
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
47
 
48
+
49
  if __name__ == "__main__":
50
  test_pii_detection()
guardrails_genie/guardrails/entity_recognition/pii_examples/run_regex_model.py CHANGED
@@ -1,15 +1,22 @@
1
- from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import RegexEntityRecognitionGuardrail
2
- from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import PII_TEST_EXAMPLES, EDGE_CASE_EXAMPLES, run_test_case, validate_entities
3
  import weave
4

5
  def test_pii_detection():
6
  """Test PII detection scenarios using predefined test cases"""
7
  weave.init("guardrails-genie-pii-regex-model")
8
-
9
  # Create the guardrail with default entities and anonymization enabled
10
  pii_guardrail = RegexEntityRecognitionGuardrail(
11
- should_anonymize=True,
12
- show_available_entities=True
13
  )
14
 
15
  # Test statistics
@@ -38,5 +45,6 @@ def test_pii_detection():
38
  print(f"Failed: {total_tests - passed_tests}")
39
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
40
 
 
41
  if __name__ == "__main__":
42
  test_pii_detection()
 
 
 
1
  import weave
2
 
3
+ from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import (
4
+ EDGE_CASE_EXAMPLES,
5
+ PII_TEST_EXAMPLES,
6
+ run_test_case,
7
+ )
8
+ from guardrails_genie.guardrails.entity_recognition.regex_entity_recognition_guardrail import (
9
+ RegexEntityRecognitionGuardrail,
10
+ )
11
+
12
+
13
  def test_pii_detection():
14
  """Test PII detection scenarios using predefined test cases"""
15
  weave.init("guardrails-genie-pii-regex-model")
16
+
17
  # Create the guardrail with default entities and anonymization enabled
18
  pii_guardrail = RegexEntityRecognitionGuardrail(
19
+ should_anonymize=True, show_available_entities=True
 
20
  )
21
 
22
  # Test statistics
 
45
  print(f"Failed: {total_tests - passed_tests}")
46
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
47
 
48
+
49
  if __name__ == "__main__":
50
  test_pii_detection()
guardrails_genie/guardrails/entity_recognition/pii_examples/run_transformers.py CHANGED
@@ -1,16 +1,30 @@
1
- from guardrails_genie.guardrails.entity_recognition.transformers_entity_recognition_guardrail import TransformersEntityRecognitionGuardrail
2
- from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import PII_TEST_EXAMPLES, EDGE_CASE_EXAMPLES, run_test_case, validate_entities
3
  import weave
4

5
  def test_pii_detection():
6
  """Test PII detection scenarios using predefined test cases"""
7
  weave.init("guardrails-genie-pii-transformers-pipeline-model")
8
-
9
  # Create the guardrail with default entities and anonymization enabled
10
  pii_guardrail = TransformersEntityRecognitionGuardrail(
11
- selected_entities=["GIVENNAME", "SURNAME", "EMAIL", "TELEPHONENUM", "SOCIALNUM"],

12
  should_anonymize=True,
13
- show_available_entities=True
14
  )
15
 
16
  # Test statistics
@@ -39,5 +53,6 @@ def test_pii_detection():
39
  print(f"Failed: {total_tests - passed_tests}")
40
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
41
 
 
42
  if __name__ == "__main__":
43
  test_pii_detection()
 
 
 
1
  import weave
2
 
3
+ from guardrails_genie.guardrails.entity_recognition.pii_examples.pii_test_examples import (
4
+ EDGE_CASE_EXAMPLES,
5
+ PII_TEST_EXAMPLES,
6
+ run_test_case,
7
+ )
8
+ from guardrails_genie.guardrails.entity_recognition.transformers_entity_recognition_guardrail import (
9
+ TransformersEntityRecognitionGuardrail,
10
+ )
11
+
12
+
13
  def test_pii_detection():
14
  """Test PII detection scenarios using predefined test cases"""
15
  weave.init("guardrails-genie-pii-transformers-pipeline-model")
16
+
17
  # Create the guardrail with default entities and anonymization enabled
18
  pii_guardrail = TransformersEntityRecognitionGuardrail(
19
+ selected_entities=[
20
+ "GIVENNAME",
21
+ "SURNAME",
22
+ "EMAIL",
23
+ "TELEPHONENUM",
24
+ "SOCIALNUM",
25
+ ],
26
  should_anonymize=True,
27
+ show_available_entities=True,
28
  )
29
 
30
  # Test statistics
 
53
  print(f"Failed: {total_tests - passed_tests}")
54
  print(f"Success Rate: {(passed_tests/total_tests)*100:.1f}%")
55
 
56
+
57
  if __name__ == "__main__":
58
  test_pii_detection()
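
Restricting selected_entities, as this script does, narrows both detection and redaction to those labels. A quick sketch of the effect; the outputs are indicative only, since they depend on the model's actual predictions:

guardrail = TransformersEntityRecognitionGuardrail(
    selected_entities=["GIVENNAME", "SURNAME", "EMAIL"],
    should_anonymize=True,
)
response = guardrail.guard(
    "Contact Jane Doe at jane@example.com", aggregate_redaction=False
)
print(response.detected_entities)  # e.g. {"GIVENNAME": ["Jane"], "SURNAME": ["Doe"], ...}
print(response.anonymized_text)    # e.g. "Contact [GIVENNAME] [SURNAME] at [EMAIL]"
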
guardrails_genie/guardrails/entity_recognition/presidio_entity_recognition_guardrail.py CHANGED
@@ -1,12 +1,18 @@
1
- from typing import List, Dict, Optional, ClassVar, Any
2
- import weave
3
- from pydantic import BaseModel
4
 
5
- from presidio_analyzer import AnalyzerEngine, RecognizerRegistry, Pattern, PatternRecognizer

6
  from presidio_anonymizer import AnonymizerEngine
 
7
 
8
  from ..base import Guardrail
9
 
 
10
  class PresidioEntityRecognitionResponse(BaseModel):
11
  contains_entities: bool
12
  detected_entities: Dict[str, List[str]]
@@ -17,6 +23,7 @@ class PresidioEntityRecognitionResponse(BaseModel):
17
  def safe(self) -> bool:
18
  return not self.contains_entities
19
 
 
20
  class PresidioEntityRecognitionSimpleResponse(BaseModel):
21
  contains_entities: bool
22
  explanation: str
@@ -26,21 +33,24 @@ class PresidioEntityRecognitionSimpleResponse(BaseModel):
26
  def safe(self) -> bool:
27
  return not self.contains_entities
28
 
29
- #TODO: Add support for transformers workflow and not just Spacy
 
30
  class PresidioEntityRecognitionGuardrail(Guardrail):
31
  @staticmethod
32
  def get_available_entities() -> List[str]:
33
  registry = RecognizerRegistry()
34
  analyzer = AnalyzerEngine(registry=registry)
35
- return [recognizer.supported_entities[0]
36
- for recognizer in analyzer.registry.recognizers]
37
-
 
 
38
  analyzer: AnalyzerEngine
39
  anonymizer: AnonymizerEngine
40
  selected_entities: List[str]
41
  should_anonymize: bool
42
  language: str
43
-
44
  def __init__(
45
  self,
46
  selected_entities: Optional[List[str]] = None,
@@ -49,7 +59,7 @@ class PresidioEntityRecognitionGuardrail(Guardrail):
49
  deny_lists: Optional[Dict[str, List[str]]] = None,
50
  regex_patterns: Optional[Dict[str, List[Dict[str, str]]]] = None,
51
  custom_recognizers: Optional[List[Any]] = None,
52
- show_available_entities: bool = False
53
  ):
54
  # If show_available_entities is True, print available entities
55
  if show_available_entities:
@@ -63,36 +73,37 @@ class PresidioEntityRecognitionGuardrail(Guardrail):
63
  # Initialize default values to all available entities
64
  if selected_entities is None:
65
  selected_entities = self.get_available_entities()
66
-
67
  # Get available entities dynamically
68
  available_entities = self.get_available_entities()
69
-
70
  # Filter out invalid entities and warn user
71
  invalid_entities = [e for e in selected_entities if e not in available_entities]
72
  valid_entities = [e for e in selected_entities if e in available_entities]
73
-
74
  if invalid_entities:
75
- print(f"\nWarning: The following entities are not available and will be ignored: {invalid_entities}")
 
 
76
  print(f"Continuing with valid entities: {valid_entities}")
77
  selected_entities = valid_entities
78
-
79
  # Initialize analyzer with default recognizers
80
  analyzer = AnalyzerEngine()
81
-
82
  # Add custom recognizers if provided
83
  if custom_recognizers:
84
  for recognizer in custom_recognizers:
85
  analyzer.registry.add_recognizer(recognizer)
86
-
87
  # Add deny list recognizers if provided
88
  if deny_lists:
89
  for entity_type, tokens in deny_lists.items():
90
  deny_list_recognizer = PatternRecognizer(
91
- supported_entity=entity_type,
92
- deny_list=tokens
93
  )
94
  analyzer.registry.add_recognizer(deny_list_recognizer)
95
-
96
  # Add regex pattern recognizers if provided
97
  if regex_patterns:
98
  for entity_type, patterns in regex_patterns.items():
@@ -100,89 +111,92 @@ class PresidioEntityRecognitionGuardrail(Guardrail):
100
  Pattern(
101
  name=pattern.get("name", f"pattern_{i}"),
102
  regex=pattern["regex"],
103
- score=pattern.get("score", 0.5)
104
- ) for i, pattern in enumerate(patterns)
 
105
  ]
106
  regex_recognizer = PatternRecognizer(
107
- supported_entity=entity_type,
108
- patterns=presidio_patterns
109
  )
110
  analyzer.registry.add_recognizer(regex_recognizer)
111
-
112
  # Initialize Presidio engines
113
  anonymizer = AnonymizerEngine()
114
-
115
  # Call parent class constructor with all fields
116
  super().__init__(
117
  analyzer=analyzer,
118
  anonymizer=anonymizer,
119
  selected_entities=selected_entities,
120
  should_anonymize=should_anonymize,
121
- language=language
122
  )
123
 
124
  @weave.op()
125
- def guard(self, prompt: str, return_detected_types: bool = True, **kwargs) -> PresidioEntityRecognitionResponse | PresidioEntityRecognitionSimpleResponse:
 
 
126
  """
127
  Check if the input prompt contains any entities using Presidio.
128
-
129
  Args:
130
  prompt: The text to analyze
131
  return_detected_types: If True, returns detailed entity type information
132
  """
133
  # Analyze text for entities
134
  analyzer_results = self.analyzer.analyze(
135
- text=str(prompt),
136
- entities=self.selected_entities,
137
- language=self.language
138
  )
139
-
140
  # Group results by entity type
141
  detected_entities = {}
142
  for result in analyzer_results:
143
  entity_type = result.entity_type
144
- text_slice = prompt[result.start:result.end]
145
  if entity_type not in detected_entities:
146
  detected_entities[entity_type] = []
147
  detected_entities[entity_type].append(text_slice)
148
-
149
  # Create explanation
150
  explanation_parts = []
151
  if detected_entities:
152
  explanation_parts.append("Found the following entities in the text:")
153
  for entity_type, instances in detected_entities.items():
154
- explanation_parts.append(f"- {entity_type}: {len(instances)} instance(s)")
 
 
155
  else:
156
  explanation_parts.append("No entities detected in the text.")
157
-
158
  # Add information about what was checked
159
  explanation_parts.append("\nChecked for these entity types:")
160
  for entity in self.selected_entities:
161
  explanation_parts.append(f"- {entity}")
162
-
163
  # Anonymize if requested
164
  anonymized_text = None
165
  if self.should_anonymize and detected_entities:
166
  anonymized_result = self.anonymizer.anonymize(
167
- text=prompt,
168
- analyzer_results=analyzer_results
169
  )
170
  anonymized_text = anonymized_result.text
171
-
172
  if return_detected_types:
173
  return PresidioEntityRecognitionResponse(
174
  contains_entities=bool(detected_entities),
175
  detected_entities=detected_entities,
176
  explanation="\n".join(explanation_parts),
177
- anonymized_text=anonymized_text
178
  )
179
  else:
180
  return PresidioEntityRecognitionSimpleResponse(
181
  contains_entities=bool(detected_entities),
182
  explanation="\n".join(explanation_parts),
183
- anonymized_text=anonymized_text
184
  )
185
-
186
  @weave.op()
187
- def predict(self, prompt: str, return_detected_types: bool = True, **kwargs) -> PresidioEntityRecognitionResponse | PresidioEntityRecognitionSimpleResponse:
188
- return self.guard(prompt, return_detected_types=return_detected_types, **kwargs)
 
 
 
1
+ from typing import Any, Dict, List, Optional
 
 
2
 
3
+ import weave
4
+ from presidio_analyzer import (
5
+ AnalyzerEngine,
6
+ Pattern,
7
+ PatternRecognizer,
8
+ RecognizerRegistry,
9
+ )
10
  from presidio_anonymizer import AnonymizerEngine
11
+ from pydantic import BaseModel
12
 
13
  from ..base import Guardrail
14
 
15
+
16
  class PresidioEntityRecognitionResponse(BaseModel):
17
  contains_entities: bool
18
  detected_entities: Dict[str, List[str]]
 
23
  def safe(self) -> bool:
24
  return not self.contains_entities
25
 
26
+
27
  class PresidioEntityRecognitionSimpleResponse(BaseModel):
28
  contains_entities: bool
29
  explanation: str
 
33
  def safe(self) -> bool:
34
  return not self.contains_entities
35
 
36
+
37
+ # TODO: Add support for the transformers workflow, not just spaCy
38
  class PresidioEntityRecognitionGuardrail(Guardrail):
39
  @staticmethod
40
  def get_available_entities() -> List[str]:
41
  registry = RecognizerRegistry()
42
  analyzer = AnalyzerEngine(registry=registry)
43
+ return [
44
+ recognizer.supported_entities[0]
45
+ for recognizer in analyzer.registry.recognizers
46
+ ]
47
+
48
  analyzer: AnalyzerEngine
49
  anonymizer: AnonymizerEngine
50
  selected_entities: List[str]
51
  should_anonymize: bool
52
  language: str
53
+
54
  def __init__(
55
  self,
56
  selected_entities: Optional[List[str]] = None,
 
59
  deny_lists: Optional[Dict[str, List[str]]] = None,
60
  regex_patterns: Optional[Dict[str, List[Dict[str, str]]]] = None,
61
  custom_recognizers: Optional[List[Any]] = None,
62
+ show_available_entities: bool = False,
63
  ):
64
  # If show_available_entities is True, print available entities
65
  if show_available_entities:
 
73
  # Initialize default values to all available entities
74
  if selected_entities is None:
75
  selected_entities = self.get_available_entities()
76
+
77
  # Get available entities dynamically
78
  available_entities = self.get_available_entities()
79
+
80
  # Filter out invalid entities and warn user
81
  invalid_entities = [e for e in selected_entities if e not in available_entities]
82
  valid_entities = [e for e in selected_entities if e in available_entities]
83
+
84
  if invalid_entities:
85
+ print(
86
+ f"\nWarning: The following entities are not available and will be ignored: {invalid_entities}"
87
+ )
88
  print(f"Continuing with valid entities: {valid_entities}")
89
  selected_entities = valid_entities
90
+
91
  # Initialize analyzer with default recognizers
92
  analyzer = AnalyzerEngine()
93
+
94
  # Add custom recognizers if provided
95
  if custom_recognizers:
96
  for recognizer in custom_recognizers:
97
  analyzer.registry.add_recognizer(recognizer)
98
+
99
  # Add deny list recognizers if provided
100
  if deny_lists:
101
  for entity_type, tokens in deny_lists.items():
102
  deny_list_recognizer = PatternRecognizer(
103
+ supported_entity=entity_type, deny_list=tokens
 
104
  )
105
  analyzer.registry.add_recognizer(deny_list_recognizer)
106
+
107
  # Add regex pattern recognizers if provided
108
  if regex_patterns:
109
  for entity_type, patterns in regex_patterns.items():
 
111
  Pattern(
112
  name=pattern.get("name", f"pattern_{i}"),
113
  regex=pattern["regex"],
114
+ score=pattern.get("score", 0.5),
115
+ )
116
+ for i, pattern in enumerate(patterns)
117
  ]
118
  regex_recognizer = PatternRecognizer(
119
+ supported_entity=entity_type, patterns=presidio_patterns
 
120
  )
121
  analyzer.registry.add_recognizer(regex_recognizer)
122
+
123
  # Initialize Presidio engines
124
  anonymizer = AnonymizerEngine()
125
+
126
  # Call parent class constructor with all fields
127
  super().__init__(
128
  analyzer=analyzer,
129
  anonymizer=anonymizer,
130
  selected_entities=selected_entities,
131
  should_anonymize=should_anonymize,
132
+ language=language,
133
  )
134
 
135
  @weave.op()
136
+ def guard(
137
+ self, prompt: str, return_detected_types: bool = True, **kwargs
138
+ ) -> PresidioEntityRecognitionResponse | PresidioEntityRecognitionSimpleResponse:
139
  """
140
  Check if the input prompt contains any entities using Presidio.
141
+
142
  Args:
143
  prompt: The text to analyze
144
  return_detected_types: If True, returns detailed entity type information
145
  """
146
  # Analyze text for entities
147
  analyzer_results = self.analyzer.analyze(
148
+ text=str(prompt), entities=self.selected_entities, language=self.language
 
 
149
  )
150
+
151
  # Group results by entity type
152
  detected_entities = {}
153
  for result in analyzer_results:
154
  entity_type = result.entity_type
155
+ text_slice = prompt[result.start : result.end]
156
  if entity_type not in detected_entities:
157
  detected_entities[entity_type] = []
158
  detected_entities[entity_type].append(text_slice)
159
+
160
  # Create explanation
161
  explanation_parts = []
162
  if detected_entities:
163
  explanation_parts.append("Found the following entities in the text:")
164
  for entity_type, instances in detected_entities.items():
165
+ explanation_parts.append(
166
+ f"- {entity_type}: {len(instances)} instance(s)"
167
+ )
168
  else:
169
  explanation_parts.append("No entities detected in the text.")
170
+
171
  # Add information about what was checked
172
  explanation_parts.append("\nChecked for these entity types:")
173
  for entity in self.selected_entities:
174
  explanation_parts.append(f"- {entity}")
175
+
176
  # Anonymize if requested
177
  anonymized_text = None
178
  if self.should_anonymize and detected_entities:
179
  anonymized_result = self.anonymizer.anonymize(
180
+ text=prompt, analyzer_results=analyzer_results
 
181
  )
182
  anonymized_text = anonymized_result.text
183
+
184
  if return_detected_types:
185
  return PresidioEntityRecognitionResponse(
186
  contains_entities=bool(detected_entities),
187
  detected_entities=detected_entities,
188
  explanation="\n".join(explanation_parts),
189
+ anonymized_text=anonymized_text,
190
  )
191
  else:
192
  return PresidioEntityRecognitionSimpleResponse(
193
  contains_entities=bool(detected_entities),
194
  explanation="\n".join(explanation_parts),
195
+ anonymized_text=anonymized_text,
196
  )
197
+
198
  @weave.op()
199
+ def predict(
200
+ self, prompt: str, return_detected_types: bool = True, **kwargs
201
+ ) -> PresidioEntityRecognitionResponse | PresidioEntityRecognitionSimpleResponse:
202
+ return self.guard(prompt, return_detected_types=return_detected_types, **kwargs)
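
A construction sketch for the guardrail above. EMAIL_ADDRESS and PHONE_NUMBER are standard Presidio entity types; anything not reported by get_available_entities() is dropped with the warning printed in __init__:

guardrail = PresidioEntityRecognitionGuardrail(
    selected_entities=["EMAIL_ADDRESS", "PHONE_NUMBER"],
    should_anonymize=True,
)
response = guardrail.guard("Reach me at jane@example.com or 555-123-4567")
print(response.contains_entities)  # True if Presidio matched either entity
print(response.anonymized_text)    # entities replaced by the AnonymizerEngine

Note that deny_lists and regex_patterns recognizers are registered with the analyzer, but analyze() is called with entities=self.selected_entities, so a custom entity type only surfaces in results if it is also listed in selected_entities.
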
guardrails_genie/guardrails/entity_recognition/regex_entity_recognition_guardrail.py CHANGED
@@ -1,11 +1,11 @@
1
- from typing import Dict, Optional, ClassVar, List
 
2
 
3
  import weave
4
  from pydantic import BaseModel
5
 
6
  from ...regex_model import RegexModel
7
  from ..base import Guardrail
8
- import re
9
 
10
 
11
  class RegexEntityRecognitionResponse(BaseModel):
@@ -33,28 +33,34 @@ class RegexEntityRecognitionGuardrail(Guardrail):
33
  regex_model: RegexModel
34
  patterns: Dict[str, str] = {}
35
  should_anonymize: bool = False
36
-
37
  DEFAULT_PATTERNS: ClassVar[Dict[str, str]] = {
38
- "EMAIL": r'\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b',
39
- "TELEPHONENUM": r'\b(\+\d{1,3}[-.]?)?\(?\d{3}\)?[-.]?\d{3}[-.]?\d{4}\b',
40
- "SOCIALNUM": r'\b\d{3}[-]?\d{2}[-]?\d{4}\b',
41
- "CREDITCARDNUMBER": r'\b\d{4}[-\s]?\d{4}[-\s]?\d{4}[-\s]?\d{4}\b',
42
- "DATEOFBIRTH": r'\b(0[1-9]|1[0-2])[-/](0[1-9]|[12]\d|3[01])[-/](19|20)\d{2}\b',
43
- "DRIVERLICENSENUM": r'[A-Z]\d{7}', # Example pattern, adjust for your needs
44
- "ACCOUNTNUM": r'\b\d{10,12}\b', # Example pattern for bank accounts
45
- "ZIPCODE": r'\b\d{5}(?:-\d{4})?\b',
46
- "GIVENNAME": r'\b[A-Z][a-z]+\b', # Basic pattern for first names
47
- "SURNAME": r'\b[A-Z][a-z]+\b', # Basic pattern for last names
48
- "CITY": r'\b[A-Z][a-z]+(?:[\s-][A-Z][a-z]+)*\b',
49
- "STREET": r'\b\d+\s+[A-Z][a-z]+\s+(?:Street|St|Avenue|Ave|Road|Rd|Boulevard|Blvd|Lane|Ln|Drive|Dr)\b',
50
- "IDCARDNUM": r'[A-Z]\d{7,8}', # Generic pattern for ID cards
51
- "USERNAME": r'@[A-Za-z]\w{3,}', # Basic username pattern
52
- "PASSWORD": r'[A-Za-z0-9@#$%^&+=]{8,}', # Basic password pattern
53
- "TAXNUM": r'\b\d{2}[-]\d{7}\b', # Example tax number pattern
54
- "BUILDINGNUM": r'\b\d+[A-Za-z]?\b' # Basic building number pattern
55
  }
56
-
57
- def __init__(self, use_defaults: bool = True, should_anonymize: bool = False, show_available_entities: bool = False, **kwargs):
 
 
 
 
 
 
58
  patterns = {}
59
  if use_defaults:
60
  patterns = self.DEFAULT_PATTERNS.copy()
@@ -63,15 +69,15 @@ class RegexEntityRecognitionGuardrail(Guardrail):
63
 
64
  if show_available_entities:
65
  self._print_available_entities(patterns.keys())
66
-
67
  # Create the RegexModel instance
68
  regex_model = RegexModel(patterns=patterns)
69
-
70
  # Initialize the base class with both the regex_model and patterns
71
  super().__init__(
72
- regex_model=regex_model,
73
  patterns=patterns,
74
- should_anonymize=should_anonymize
75
  )
76
 
77
  def text_to_pattern(self, text: str) -> str:
@@ -82,7 +88,7 @@ class RegexEntityRecognitionGuardrail(Guardrail):
82
  escaped_text = re.escape(text)
83
  # Create a pattern that matches the exact text, case-insensitive
84
  return rf"\b{escaped_text}\b"
85
-
86
  def _print_available_entities(self, entities: List[str]):
87
  """Print available entities"""
88
  print("\nAvailable entity types:")
@@ -92,16 +98,23 @@ class RegexEntityRecognitionGuardrail(Guardrail):
92
  print("=" * 25 + "\n")
93
 
94
  @weave.op()
95
- def guard(self, prompt: str, custom_terms: Optional[list[str]] = None, return_detected_types: bool = True, aggregate_redaction: bool = True, **kwargs) -> RegexEntityRecognitionResponse | RegexEntityRecognitionSimpleResponse:
 
 
 
 
 
 
 
96
  """
97
  Check if the input prompt contains any entities based on the regex patterns.
98
-
99
  Args:
100
  prompt: Input text to check for entities
101
- custom_terms: List of custom terms to be converted into regex patterns. If provided,
102
  only these terms will be checked, ignoring default patterns.
103
  return_detected_types: If True, returns detailed entity type information
104
-
105
  Returns:
106
  RegexEntityRecognitionResponse or RegexEntityRecognitionSimpleResponse containing detection results
107
  """
@@ -113,7 +126,7 @@ class RegexEntityRecognitionGuardrail(Guardrail):
113
  else:
114
  # Use the original regex_model if no custom terms provided
115
  result = self.regex_model.check(prompt)
116
-
117
  # Create detailed explanation
118
  explanation_parts = []
119
  if result.matched_patterns:
@@ -122,35 +135,50 @@ class RegexEntityRecognitionGuardrail(Guardrail):
122
  explanation_parts.append(f"- {entity_type}: {len(matches)} instance(s)")
123
  else:
124
  explanation_parts.append("No entities detected in the text.")
125
-
126
  if result.failed_patterns:
127
  explanation_parts.append("\nChecked but did not find these entity types:")
128
  for pattern in result.failed_patterns:
129
  explanation_parts.append(f"- {pattern}")
130
-
131
  # Updated anonymization logic
132
  anonymized_text = None
133
- if getattr(self, 'should_anonymize', False) and result.matched_patterns:
134
  anonymized_text = prompt
135
  for entity_type, matches in result.matched_patterns.items():
136
  for match in matches:
137
- replacement = "[redacted]" if aggregate_redaction else f"[{entity_type.upper()}]"
 
 
 
 
138
  anonymized_text = anonymized_text.replace(match, replacement)
139
-
140
  if return_detected_types:
141
  return RegexEntityRecognitionResponse(
142
  contains_entities=not result.passed,
143
  detected_entities=result.matched_patterns,
144
  explanation="\n".join(explanation_parts),
145
- anonymized_text=anonymized_text
146
  )
147
  else:
148
  return RegexEntityRecognitionSimpleResponse(
149
  contains_entities=not result.passed,
150
  explanation="\n".join(explanation_parts),
151
- anonymized_text=anonymized_text
152
  )
153
 
154
  @weave.op()
155
- def predict(self, prompt: str, return_detected_types: bool = True, aggregate_redaction: bool = True, **kwargs) -> RegexEntityRecognitionResponse | RegexEntityRecognitionSimpleResponse:
156
- return self.guard(prompt, return_detected_types=return_detected_types, aggregate_redaction=aggregate_redaction, **kwargs)

1
+ import re
2
+ from typing import ClassVar, Dict, List, Optional
3
 
4
  import weave
5
  from pydantic import BaseModel
6
 
7
  from ...regex_model import RegexModel
8
  from ..base import Guardrail
 
9
 
10
 
11
  class RegexEntityRecognitionResponse(BaseModel):
 
33
  regex_model: RegexModel
34
  patterns: Dict[str, str] = {}
35
  should_anonymize: bool = False
36
+
37
  DEFAULT_PATTERNS: ClassVar[Dict[str, str]] = {
38
+ "EMAIL": r"\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b",
39
+ "TELEPHONENUM": r"\b(\+\d{1,3}[-.]?)?\(?\d{3}\)?[-.]?\d{3}[-.]?\d{4}\b",
40
+ "SOCIALNUM": r"\b\d{3}[-]?\d{2}[-]?\d{4}\b",
41
+ "CREDITCARDNUMBER": r"\b\d{4}[-\s]?\d{4}[-\s]?\d{4}[-\s]?\d{4}\b",
42
+ "DATEOFBIRTH": r"\b(0[1-9]|1[0-2])[-/](0[1-9]|[12]\d|3[01])[-/](19|20)\d{2}\b",
43
+ "DRIVERLICENSENUM": r"[A-Z]\d{7}", # Example pattern, adjust for your needs
44
+ "ACCOUNTNUM": r"\b\d{10,12}\b", # Example pattern for bank accounts
45
+ "ZIPCODE": r"\b\d{5}(?:-\d{4})?\b",
46
+ "GIVENNAME": r"\b[A-Z][a-z]+\b", # Basic pattern for first names
47
+ "SURNAME": r"\b[A-Z][a-z]+\b", # Basic pattern for last names
48
+ "CITY": r"\b[A-Z][a-z]+(?:[\s-][A-Z][a-z]+)*\b",
49
+ "STREET": r"\b\d+\s+[A-Z][a-z]+\s+(?:Street|St|Avenue|Ave|Road|Rd|Boulevard|Blvd|Lane|Ln|Drive|Dr)\b",
50
+ "IDCARDNUM": r"[A-Z]\d{7,8}", # Generic pattern for ID cards
51
+ "USERNAME": r"@[A-Za-z]\w{3,}", # Basic username pattern
52
+ "PASSWORD": r"[A-Za-z0-9@#$%^&+=]{8,}", # Basic password pattern
53
+ "TAXNUM": r"\b\d{2}[-]\d{7}\b", # Example tax number pattern
54
+ "BUILDINGNUM": r"\b\d+[A-Za-z]?\b", # Basic building number pattern
55
  }
56
+
57
+ def __init__(
58
+ self,
59
+ use_defaults: bool = True,
60
+ should_anonymize: bool = False,
61
+ show_available_entities: bool = False,
62
+ **kwargs,
63
+ ):
64
  patterns = {}
65
  if use_defaults:
66
  patterns = self.DEFAULT_PATTERNS.copy()
 
69
 
70
  if show_available_entities:
71
  self._print_available_entities(patterns.keys())
72
+
73
  # Create the RegexModel instance
74
  regex_model = RegexModel(patterns=patterns)
75
+
76
  # Initialize the base class with both the regex_model and patterns
77
  super().__init__(
78
+ regex_model=regex_model,
79
  patterns=patterns,
80
+ should_anonymize=should_anonymize,
81
  )
82
 
83
  def text_to_pattern(self, text: str) -> str:
 
88
  escaped_text = re.escape(text)
89
  # Create a pattern that matches the exact text, case-insensitive
90
  return rf"\b{escaped_text}\b"
91
+
92
  def _print_available_entities(self, entities: List[str]):
93
  """Print available entities"""
94
  print("\nAvailable entity types:")
 
98
  print("=" * 25 + "\n")
99
 
100
  @weave.op()
101
+ def guard(
102
+ self,
103
+ prompt: str,
104
+ custom_terms: Optional[list[str]] = None,
105
+ return_detected_types: bool = True,
106
+ aggregate_redaction: bool = True,
107
+ **kwargs,
108
+ ) -> RegexEntityRecognitionResponse | RegexEntityRecognitionSimpleResponse:
109
  """
110
  Check if the input prompt contains any entities based on the regex patterns.
111
+
112
  Args:
113
  prompt: Input text to check for entities
114
+ custom_terms: List of custom terms to be converted into regex patterns. If provided,
115
  only these terms will be checked, ignoring default patterns.
116
  return_detected_types: If True, returns detailed entity type information
117
+
118
  Returns:
119
  RegexEntityRecognitionResponse or RegexEntityRecognitionSimpleResponse containing detection results
120
  """
 
126
  else:
127
  # Use the original regex_model if no custom terms provided
128
  result = self.regex_model.check(prompt)
129
+
130
  # Create detailed explanation
131
  explanation_parts = []
132
  if result.matched_patterns:
 
135
  explanation_parts.append(f"- {entity_type}: {len(matches)} instance(s)")
136
  else:
137
  explanation_parts.append("No entities detected in the text.")
138
+
139
  if result.failed_patterns:
140
  explanation_parts.append("\nChecked but did not find these entity types:")
141
  for pattern in result.failed_patterns:
142
  explanation_parts.append(f"- {pattern}")
143
+
144
  # Updated anonymization logic
145
  anonymized_text = None
146
+ if getattr(self, "should_anonymize", False) and result.matched_patterns:
147
  anonymized_text = prompt
148
  for entity_type, matches in result.matched_patterns.items():
149
  for match in matches:
150
+ replacement = (
151
+ "[redacted]"
152
+ if aggregate_redaction
153
+ else f"[{entity_type.upper()}]"
154
+ )
155
  anonymized_text = anonymized_text.replace(match, replacement)
156
+
157
  if return_detected_types:
158
  return RegexEntityRecognitionResponse(
159
  contains_entities=not result.passed,
160
  detected_entities=result.matched_patterns,
161
  explanation="\n".join(explanation_parts),
162
+ anonymized_text=anonymized_text,
163
  )
164
  else:
165
  return RegexEntityRecognitionSimpleResponse(
166
  contains_entities=not result.passed,
167
  explanation="\n".join(explanation_parts),
168
+ anonymized_text=anonymized_text,
169
  )
170
 
171
  @weave.op()
172
+ def predict(
173
+ self,
174
+ prompt: str,
175
+ return_detected_types: bool = True,
176
+ aggregate_redaction: bool = True,
177
+ **kwargs,
178
+ ) -> RegexEntityRecognitionResponse | RegexEntityRecognitionSimpleResponse:
179
+ return self.guard(
180
+ prompt,
181
+ return_detected_types=return_detected_types,
182
+ aggregate_redaction=aggregate_redaction,
183
+ **kwargs,
184
+ )
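
A usage sketch for the two anonymization modes and the custom_terms path above; the printed outputs are indicative, assuming the default patterns match as intended:

guardrail = RegexEntityRecognitionGuardrail(use_defaults=True, should_anonymize=True)

# Per-entity markers instead of the aggregated [redacted] token
response = guardrail.guard(
    "Call 555-123-4567 or write to jane@example.com",
    aggregate_redaction=False,
)
print(response.anonymized_text)  # e.g. "Call [TELEPHONENUM] or write to [EMAIL]"

# custom_terms builds exact-match patterns and ignores the default ones
response = guardrail.guard("Status update on Project Titan", custom_terms=["Project Titan"])
print(response.contains_entities)  # True if the term appears verbatim
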
guardrails_genie/guardrails/entity_recognition/transformers_entity_recognition_guardrail.py CHANGED
@@ -1,9 +1,11 @@
1
- from typing import List, Dict, Optional, ClassVar
2
- from transformers import pipeline, AutoConfig
3
- import json
4
  from pydantic import BaseModel
 
 
5
  from ..base import Guardrail
6
- import weave
7
 
8
  class TransformersEntityRecognitionResponse(BaseModel):
9
  contains_entities: bool
@@ -15,6 +17,7 @@ class TransformersEntityRecognitionResponse(BaseModel):
15
  def safe(self) -> bool:
16
  return not self.contains_entities
17
 
 
18
  class TransformersEntityRecognitionSimpleResponse(BaseModel):
19
  contains_entities: bool
20
  explanation: str
@@ -24,14 +27,15 @@ class TransformersEntityRecognitionSimpleResponse(BaseModel):
24
  def safe(self) -> bool:
25
  return not self.contains_entities
26
 
 
27
  class TransformersEntityRecognitionGuardrail(Guardrail):
28
  """Generic guardrail for detecting entities using any token classification model."""
29
-
30
  _pipeline: Optional[object] = None
31
  selected_entities: List[str]
32
  should_anonymize: bool
33
  available_entities: List[str]
34
-
35
  def __init__(
36
  self,
37
  model_name: str = "iiiorg/piiranha-v1-detect-personal-information",
@@ -42,50 +46,52 @@ class TransformersEntityRecognitionGuardrail(Guardrail):
42
  # Load model config and extract available entities
43
  config = AutoConfig.from_pretrained(model_name)
44
  entities = self._extract_entities_from_config(config)
45
-
46
  if show_available_entities:
47
  self._print_available_entities(entities)
48
-
49
  # Initialize default values if needed
50
  if selected_entities is None:
51
  selected_entities = entities # Use all available entities by default
52
-
53
  # Filter out invalid entities and warn user
54
  invalid_entities = [e for e in selected_entities if e not in entities]
55
  valid_entities = [e for e in selected_entities if e in entities]
56
-
57
  if invalid_entities:
58
- print(f"\nWarning: The following entities are not available and will be ignored: {invalid_entities}")
 
 
59
  print(f"Continuing with valid entities: {valid_entities}")
60
  selected_entities = valid_entities
61
-
62
  # Call parent class constructor
63
  super().__init__(
64
  selected_entities=selected_entities,
65
  should_anonymize=should_anonymize,
66
- available_entities=entities
67
  )
68
-
69
  # Initialize pipeline
70
  self._pipeline = pipeline(
71
  task="token-classification",
72
  model=model_name,
73
- aggregation_strategy="simple" # Merge same entities
74
  )
75
 
76
  def _extract_entities_from_config(self, config) -> List[str]:
77
  """Extract unique entity types from the model config."""
78
  # Get id2label mapping from config
79
  id2label = config.id2label
80
-
81
  # Extract unique entity types (removing B- and I- prefixes)
82
  entities = set()
83
  for label in id2label.values():
84
- if label.startswith(('B-', 'I-')):
85
  entities.add(label[2:]) # Remove prefix
86
- elif label != 'O': # Skip the 'O' (Outside) label
87
  entities.add(label)
88
-
89
  return sorted(list(entities))
90
 
91
  def _print_available_entities(self, entities: List[str]):
@@ -103,48 +109,60 @@ class TransformersEntityRecognitionGuardrail(Guardrail):
103
  def _detect_entities(self, text: str) -> Dict[str, List[str]]:
104
  """Detect entities in the text using the pipeline."""
105
  results = self._pipeline(text)
106
-
107
  # Group findings by entity type
108
  detected_entities = {}
109
  for entity in results:
110
- entity_type = entity['entity_group']
111
  if entity_type in self.selected_entities:
112
  if entity_type not in detected_entities:
113
  detected_entities[entity_type] = []
114
- detected_entities[entity_type].append(entity['word'])
115
-
116
  return detected_entities
117
 
118
  def _anonymize_text(self, text: str, aggregate_redaction: bool = True) -> str:
119
  """Anonymize detected entities in text using the pipeline."""
120
  results = self._pipeline(text)
121
-
122
  # Sort entities by start position in reverse order to avoid offset issues
123
- entities = sorted(results, key=lambda x: x['start'], reverse=True)
124
-
125
  # Create a mutable list of characters
126
  chars = list(text)
127
-
128
  # Apply redactions
129
  for entity in entities:
130
- if entity['entity_group'] in self.selected_entities:
131
- start, end = entity['start'], entity['end']
132
- replacement = ' [redacted] ' if aggregate_redaction else f" [{entity['entity_group']}] "
133
-
 
 
 
 
134
  # Replace the entity with the redaction marker
135
  chars[start:end] = replacement
136
-
137
  # Join characters and clean up only consecutive spaces (preserving newlines)
138
- result = ''.join(chars)
139
  # Replace multiple spaces with single space, but preserve newlines
140
- lines = result.split('\n')
141
- cleaned_lines = [' '.join(line.split()) for line in lines]
142
- return '\n'.join(cleaned_lines)
143
 
144
  @weave.op()
145
- def guard(self, prompt: str, return_detected_types: bool = True, aggregate_redaction: bool = True) -> TransformersEntityRecognitionResponse | TransformersEntityRecognitionSimpleResponse:
 
 
 
 
 
 
 
 
146
  """Check if the input prompt contains any entities using the transformer pipeline.
147
-
148
  Args:
149
  prompt: The text to analyze
150
  return_detected_types: If True, returns detailed entity type information
@@ -152,39 +170,55 @@ class TransformersEntityRecognitionGuardrail(Guardrail):
152
  """
153
  # Detect entities
154
  detected_entities = self._detect_entities(prompt)
155
-
156
  # Create explanation
157
  explanation_parts = []
158
  if detected_entities:
159
  explanation_parts.append("Found the following entities in the text:")
160
  for entity_type, instances in detected_entities.items():
161
- explanation_parts.append(f"- {entity_type}: {len(instances)} instance(s)")
 
 
162
  else:
163
  explanation_parts.append("No entities detected in the text.")
164
-
165
  explanation_parts.append("\nChecked for these entities:")
166
  for entity in self.selected_entities:
167
  explanation_parts.append(f"- {entity}")
168
-
169
  # Anonymize if requested
170
  anonymized_text = None
171
  if self.should_anonymize and detected_entities:
172
  anonymized_text = self._anonymize_text(prompt, aggregate_redaction)
173
-
174
  if return_detected_types:
175
  return TransformersEntityRecognitionResponse(
176
  contains_entities=bool(detected_entities),
177
  detected_entities=detected_entities,
178
  explanation="\n".join(explanation_parts),
179
- anonymized_text=anonymized_text
180
  )
181
  else:
182
  return TransformersEntityRecognitionSimpleResponse(
183
  contains_entities=bool(detected_entities),
184
  explanation="\n".join(explanation_parts),
185
- anonymized_text=anonymized_text
186
  )
187
 
188
  @weave.op()
189
- def predict(self, prompt: str, return_detected_types: bool = True, aggregate_redaction: bool = True, **kwargs) -> TransformersEntityRecognitionResponse | TransformersEntityRecognitionSimpleResponse:
190
- return self.guard(prompt, return_detected_types=return_detected_types, aggregate_redaction=aggregate_redaction, **kwargs)

1
+ from typing import Dict, List, Optional
2
+
3
+ import weave
4
  from pydantic import BaseModel
5
+ from transformers import AutoConfig, pipeline
6
+
7
  from ..base import Guardrail
8
+
9
 
10
  class TransformersEntityRecognitionResponse(BaseModel):
11
  contains_entities: bool
 
17
  def safe(self) -> bool:
18
  return not self.contains_entities
19
 
20
+
21
  class TransformersEntityRecognitionSimpleResponse(BaseModel):
22
  contains_entities: bool
23
  explanation: str
 
27
  def safe(self) -> bool:
28
  return not self.contains_entities
29
 
30
+
31
  class TransformersEntityRecognitionGuardrail(Guardrail):
32
  """Generic guardrail for detecting entities using any token classification model."""
33
+
34
  _pipeline: Optional[object] = None
35
  selected_entities: List[str]
36
  should_anonymize: bool
37
  available_entities: List[str]
38
+
39
  def __init__(
40
  self,
41
  model_name: str = "iiiorg/piiranha-v1-detect-personal-information",
 
46
  # Load model config and extract available entities
47
  config = AutoConfig.from_pretrained(model_name)
48
  entities = self._extract_entities_from_config(config)
49
+
50
  if show_available_entities:
51
  self._print_available_entities(entities)
52
+
53
  # Initialize default values if needed
54
  if selected_entities is None:
55
  selected_entities = entities # Use all available entities by default
56
+
57
  # Filter out invalid entities and warn user
58
  invalid_entities = [e for e in selected_entities if e not in entities]
59
  valid_entities = [e for e in selected_entities if e in entities]
60
+
61
  if invalid_entities:
62
+ print(
63
+ f"\nWarning: The following entities are not available and will be ignored: {invalid_entities}"
64
+ )
65
  print(f"Continuing with valid entities: {valid_entities}")
66
  selected_entities = valid_entities
67
+
68
  # Call parent class constructor
69
  super().__init__(
70
  selected_entities=selected_entities,
71
  should_anonymize=should_anonymize,
72
+ available_entities=entities,
73
  )
74
+
75
  # Initialize pipeline
76
  self._pipeline = pipeline(
77
  task="token-classification",
78
  model=model_name,
79
+ aggregation_strategy="simple", # Merge same entities
80
  )
81
 
82
  def _extract_entities_from_config(self, config) -> List[str]:
83
  """Extract unique entity types from the model config."""
84
  # Get id2label mapping from config
85
  id2label = config.id2label
86
+
87
  # Extract unique entity types (removing B- and I- prefixes)
88
  entities = set()
89
  for label in id2label.values():
90
+ if label.startswith(("B-", "I-")):
91
  entities.add(label[2:]) # Remove prefix
92
+ elif label != "O": # Skip the 'O' (Outside) label
93
  entities.add(label)
94
+
95
  return sorted(list(entities))
96
 
97
  def _print_available_entities(self, entities: List[str]):
 
109
  def _detect_entities(self, text: str) -> Dict[str, List[str]]:
110
  """Detect entities in the text using the pipeline."""
111
  results = self._pipeline(text)
112
+
113
  # Group findings by entity type
114
  detected_entities = {}
115
  for entity in results:
116
+ entity_type = entity["entity_group"]
117
  if entity_type in self.selected_entities:
118
  if entity_type not in detected_entities:
119
  detected_entities[entity_type] = []
120
+ detected_entities[entity_type].append(entity["word"])
121
+
122
  return detected_entities
123
 
124
  def _anonymize_text(self, text: str, aggregate_redaction: bool = True) -> str:
125
  """Anonymize detected entities in text using the pipeline."""
126
  results = self._pipeline(text)
127
+
128
  # Sort entities by start position in reverse order to avoid offset issues
129
+ entities = sorted(results, key=lambda x: x["start"], reverse=True)
130
+
131
  # Create a mutable list of characters
132
  chars = list(text)
133
+
134
  # Apply redactions
135
  for entity in entities:
136
+ if entity["entity_group"] in self.selected_entities:
137
+ start, end = entity["start"], entity["end"]
138
+ replacement = (
139
+ " [redacted] "
140
+ if aggregate_redaction
141
+ else f" [{entity['entity_group']}] "
142
+ )
143
+
144
  # Replace the entity with the redaction marker
145
  chars[start:end] = replacement
146
+
147
  # Join characters and clean up only consecutive spaces (preserving newlines)
148
+ result = "".join(chars)
149
  # Replace multiple spaces with single space, but preserve newlines
150
+ lines = result.split("\n")
151
+ cleaned_lines = [" ".join(line.split()) for line in lines]
152
+ return "\n".join(cleaned_lines)
153
 
154
  @weave.op()
155
+ def guard(
156
+ self,
157
+ prompt: str,
158
+ return_detected_types: bool = True,
159
+ aggregate_redaction: bool = True,
160
+ ) -> (
161
+ TransformersEntityRecognitionResponse
162
+ | TransformersEntityRecognitionSimpleResponse
163
+ ):
164
  """Check if the input prompt contains any entities using the transformer pipeline.
165
+
166
  Args:
167
  prompt: The text to analyze
168
  return_detected_types: If True, returns detailed entity type information
 
170
  """
171
  # Detect entities
172
  detected_entities = self._detect_entities(prompt)
173
+
174
  # Create explanation
175
  explanation_parts = []
176
  if detected_entities:
177
  explanation_parts.append("Found the following entities in the text:")
178
  for entity_type, instances in detected_entities.items():
179
+ explanation_parts.append(
180
+ f"- {entity_type}: {len(instances)} instance(s)"
181
+ )
182
  else:
183
  explanation_parts.append("No entities detected in the text.")
184
+
185
  explanation_parts.append("\nChecked for these entities:")
186
  for entity in self.selected_entities:
187
  explanation_parts.append(f"- {entity}")
188
+
189
  # Anonymize if requested
190
  anonymized_text = None
191
  if self.should_anonymize and detected_entities:
192
  anonymized_text = self._anonymize_text(prompt, aggregate_redaction)
193
+
194
  if return_detected_types:
195
  return TransformersEntityRecognitionResponse(
196
  contains_entities=bool(detected_entities),
197
  detected_entities=detected_entities,
198
  explanation="\n".join(explanation_parts),
199
+ anonymized_text=anonymized_text,
200
  )
201
  else:
202
  return TransformersEntityRecognitionSimpleResponse(
203
  contains_entities=bool(detected_entities),
204
  explanation="\n".join(explanation_parts),
205
+ anonymized_text=anonymized_text,
206
  )
207
 
208
  @weave.op()
209
+ def predict(
210
+ self,
211
+ prompt: str,
212
+ return_detected_types: bool = True,
213
+ aggregate_redaction: bool = True,
214
+ **kwargs,
215
+ ) -> (
216
+ TransformersEntityRecognitionResponse
217
+ | TransformersEntityRecognitionSimpleResponse
218
+ ):
219
+ return self.guard(
220
+ prompt,
221
+ return_detected_types=return_detected_types,
222
+ aggregate_redaction=aggregate_redaction,
223
+ **kwargs,
224
+ )
guardrails_genie/guardrails/manager.py CHANGED
@@ -1,6 +1,6 @@
1
  import weave
2
- from rich.progress import track
3
  from pydantic import BaseModel
 
4
 
5
  from .base import Guardrail
6
 
 
1
  import weave
 
2
  from pydantic import BaseModel
3
+ from rich.progress import track
4
 
5
  from .base import Guardrail
6
 
guardrails_genie/metrics.py CHANGED
@@ -5,12 +5,55 @@ import weave
5
 
6
 
7
  class AccuracyMetric(weave.Scorer):
8
  @weave.op()
9
  def score(self, output: dict, label: int):
10
- return {"correct": bool(label) == output["safe"]}
11
 
12
  @weave.op()
13
  def summarize(self, score_rows: list) -> Optional[dict]:
14
  valid_data = [
15
  x.get("correct") for x in score_rows if x.get("correct") is not None
16
  ]
 
5
 
6
 
7
  class AccuracyMetric(weave.Scorer):
8
+ """
9
+ A class to compute and summarize accuracy-related metrics for model outputs.
10
+
11
+ This class extends the `weave.Scorer` and provides operations to score
12
+ individual predictions and summarize the results across multiple predictions.
13
+ It calculates the accuracy, precision, recall, and F1 score based on the
14
+ comparison between predicted outputs and true labels.
15
+ """
16
+
17
  @weave.op()
18
  def score(self, output: dict, label: int):
19
+ """
20
+ Evaluate the correctness of a single prediction.
21
+
22
+ This method compares a model's predicted output with the true label
23
+ to determine if the prediction is correct. It checks if the 'safe'
24
+ field in the output dictionary, when converted to an integer, matches
25
+ the provided label.
26
+
27
+ Args:
28
+ output (dict): A dictionary containing the model's prediction,
29
+ specifically the 'safe' key which holds the predicted value.
30
+ label (int): The true label against which the prediction is compared.
31
+
32
+ Returns:
33
+ dict: A dictionary with a single key 'correct', which is True if the
34
+ prediction matches the label, otherwise False.
35
+ """
36
+ return {"correct": label == int(output["safe"])}
37
 
38
  @weave.op()
39
  def summarize(self, score_rows: list) -> Optional[dict]:
40
+ """
41
+ Summarize the accuracy-related metrics from a list of prediction scores.
42
+
43
+ This method processes a list of score dictionaries, each containing a
44
+ 'correct' key indicating whether a prediction was correct. It calculates
45
+ several metrics: accuracy, precision, recall, and F1 score, based on the
46
+ number of true positives, false positives, and false negatives.
47
+
48
+ Args:
49
+ score_rows (list): A list of dictionaries, each with a 'correct' key
50
+ indicating the correctness of individual predictions.
51
+
52
+ Returns:
53
+ Optional[dict]: A dictionary containing the calculated metrics:
54
+ 'accuracy', 'precision', 'recall', and 'f1_score'. If no valid data
55
+ is present, all metrics default to 0.
56
+ """
57
  valid_data = [
58
  x.get("correct") for x in score_rows if x.get("correct") is not None
59
  ]
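The summarize docstring above names accuracy, precision, recall, and F1, but this hunk only shows the valid_data extraction. As a reference point, here is a hedged sketch of the standard formulas with zero-division guards; this is a hypothetical standalone helper, not the library's implementation:

from typing import Dict


def classification_summary(tp: int, fp: int, fn: int, tn: int) -> Dict[str, float]:
    # Standard metric definitions; each ratio is guarded against a zero denominator.
    total = tp + fp + fn + tn
    accuracy = (tp + tn) / total if total else 0.0
    precision = tp / (tp + fp) if (tp + fp) else 0.0
    recall = tp / (tp + fn) if (tp + fn) else 0.0
    f1 = 2 * precision * recall / (precision + recall) if (precision + recall) else 0.0
    return {"accuracy": accuracy, "precision": precision, "recall": recall, "f1_score": f1}


# Worked example: 8 TP, 1 FP, 1 FN, 10 TN
# -> accuracy 0.90, precision ~0.889, recall ~0.889, f1 ~0.889
print(classification_summary(tp=8, fp=1, fn=1, tn=10))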
guardrails_genie/regex_model.py CHANGED
@@ -1,5 +1,6 @@
1
- from typing import List, Dict, Optional
2
  import re
 
 
3
  import weave
4
  from pydantic import BaseModel
5
 
@@ -16,7 +17,7 @@ class RegexModel(weave.Model):
16
  def __init__(self, patterns: Dict[str, str]) -> None:
17
  """
18
  Initialize RegexModel with a dictionary of patterns.
19
-
20
  Args:
21
  patterns: Dictionary where key is pattern name and value is regex pattern
22
  Example: {"email": r"[^@ \t\r\n]+@[^@ \t\r\n]+\.[^@ \t\r\n]+",
@@ -31,35 +32,37 @@ class RegexModel(weave.Model):
31
  def check(self, prompt: str) -> RegexResult:
32
  """
33
  Check text against all patterns and return detailed results.
34
-
35
  Args:
36
  text: Input text to check against patterns
37
-
38
  Returns:
39
  RegexResult containing pass/fail status and details about matches
40
  """
41
  matched_patterns = {}
42
  failed_patterns = []
43
-
44
  for pattern_name, pattern in self.patterns.items():
45
  matches = []
46
  for match in re.finditer(pattern, prompt):
47
  if match.groups():
48
  # If there are capture groups, join them with a separator
49
- matches.append('-'.join(str(g) for g in match.groups() if g is not None))
 
 
50
  else:
51
  # If no capture groups, use the full match
52
  matches.append(match.group(0))
53
-
54
  if matches:
55
  matched_patterns[pattern_name] = matches
56
  else:
57
  failed_patterns.append(pattern_name)
58
-
59
  return RegexResult(
60
  matched_patterns=matched_patterns,
61
  failed_patterns=failed_patterns,
62
- passed=len(matched_patterns) == 0
63
  )
64
 
65
  @weave.op()
@@ -67,4 +70,4 @@ class RegexModel(weave.Model):
67
  """
68
  Alias for check() to maintain consistency with other models.
69
  """
70
- return self.check(text)
 
 
1
  import re
2
+ from typing import Dict, List
3
+
4
  import weave
5
  from pydantic import BaseModel
6
 
 
17
  def __init__(self, patterns: Dict[str, str]) -> None:
18
  """
19
  Initialize RegexModel with a dictionary of patterns.
20
+
21
  Args:
22
  patterns: Dictionary where key is pattern name and value is regex pattern
23
  Example: {"email": r"[^@ \t\r\n]+@[^@ \t\r\n]+\.[^@ \t\r\n]+",
 
32
  def check(self, prompt: str) -> RegexResult:
33
  """
34
  Check text against all patterns and return detailed results.
35
+
36
  Args:
37
  text: Input text to check against patterns
38
+
39
  Returns:
40
  RegexResult containing pass/fail status and details about matches
41
  """
42
  matched_patterns = {}
43
  failed_patterns = []
44
+
45
  for pattern_name, pattern in self.patterns.items():
46
  matches = []
47
  for match in re.finditer(pattern, prompt):
48
  if match.groups():
49
  # If there are capture groups, join them with a separator
50
+ matches.append(
51
+ "-".join(str(g) for g in match.groups() if g is not None)
52
+ )
53
  else:
54
  # If no capture groups, use the full match
55
  matches.append(match.group(0))
56
+
57
  if matches:
58
  matched_patterns[pattern_name] = matches
59
  else:
60
  failed_patterns.append(pattern_name)
61
+
62
  return RegexResult(
63
  matched_patterns=matched_patterns,
64
  failed_patterns=failed_patterns,
65
+ passed=len(matched_patterns) == 0,
66
  )
67
 
68
  @weave.op()
 
70
  """
71
  Alias for check() to maintain consistency with other models.
72
  """
73
+ return self.check(text)
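A short usage sketch of the cleaned-up RegexModel; the email pattern is the one from the class docstring, and the prompt is illustrative (weave logging is optional for direct calls):

from guardrails_genie.regex_model import RegexModel

model = RegexModel(
    patterns={"email": r"[^@ \t\r\n]+@[^@ \t\r\n]+\.[^@ \t\r\n]+"}
)
result = model.check("Reach me at jane@example.com")

print(result.passed)            # False: at least one pattern matched
print(result.matched_patterns)  # {"email": ["jane@example.com"]}
print(result.failed_patterns)   # []: every pattern found a match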
guardrails_genie/utils.py CHANGED
@@ -19,9 +19,9 @@ class EvaluationCallManager:
19
  """
20
  Manages the evaluation calls for a specific project and entity in Weave.
21
 
22
- This class is responsible for initializing and managing evaluation calls associated with a
23
- specific project and entity. It provides functionality to collect guardrail guard calls
24
- from evaluation predictions and scores, and render these calls into a structured format
25
  suitable for display in Streamlit.
26
 
27
  Args:
@@ -30,6 +30,7 @@ class EvaluationCallManager:
30
  call_id (str): The call id.
31
  max_count (int): The maximum number of guardrail guard calls to collect from the evaluation.
32
  """
 
33
  def __init__(self, entity: str, project: str, call_id: str, max_count: int = 10):
34
  self.base_call = weave.init(f"{entity}/{project}").get_call(call_id=call_id)
35
  self.max_count = max_count
@@ -40,10 +41,10 @@ class EvaluationCallManager:
40
  """
41
  Collects guardrail guard calls from evaluation predictions and scores.
42
 
43
- This function iterates through the children calls of the base evaluation call,
44
- extracting relevant guardrail guard calls and their associated scores. It stops
45
- collecting calls if it encounters an "Evaluation.summarize" operation or if the
46
- maximum count of guardrail guard calls is reached. The collected calls are stored
47
  in a list of dictionaries, each containing the input prompt, outputs, and score.
48
 
49
  Returns:
@@ -77,9 +78,9 @@ class EvaluationCallManager:
77
  Renders the collected guardrail guard calls into a pandas DataFrame suitable for
78
  display in Streamlit.
79
 
80
- This function processes the collected guardrail guard calls stored in `self.call_list` and
81
- organizes them into a dictionary format that can be easily converted into a pandas DataFrame.
82
- The DataFrame contains columns for the input prompts, the safety status of the outputs, and
83
  the correctness of the predictions for each guardrail.
84
 
85
  The structure of the DataFrame is as follows:
@@ -87,7 +88,7 @@ class EvaluationCallManager:
87
  - Subsequent columns contain the safety status and prediction correctness for each guardrail.
88
 
89
  Returns:
90
- pd.DataFrame: A DataFrame containing the input prompts, safety status, and prediction
91
  correctness for each guardrail.
92
  """
93
  dataframe = {
 
19
  """
20
  Manages the evaluation calls for a specific project and entity in Weave.
21
 
22
+ This class is responsible for initializing and managing evaluation calls associated with a
23
+ specific project and entity. It provides functionality to collect guardrail guard calls
24
+ from evaluation predictions and scores, and render these calls into a structured format
25
  suitable for display in Streamlit.
26
 
27
  Args:
 
30
  call_id (str): The call id.
31
  max_count (int): The maximum number of guardrail guard calls to collect from the evaluation.
32
  """
33
+
34
  def __init__(self, entity: str, project: str, call_id: str, max_count: int = 10):
35
  self.base_call = weave.init(f"{entity}/{project}").get_call(call_id=call_id)
36
  self.max_count = max_count
 
41
  """
42
  Collects guardrail guard calls from evaluation predictions and scores.
43
 
44
+ This function iterates through the children calls of the base evaluation call,
45
+ extracting relevant guardrail guard calls and their associated scores. It stops
46
+ collecting calls if it encounters an "Evaluation.summarize" operation or if the
47
+ maximum count of guardrail guard calls is reached. The collected calls are stored
48
  in a list of dictionaries, each containing the input prompt, outputs, and score.
49
 
50
  Returns:
 
78
  Renders the collected guardrail guard calls into a pandas DataFrame suitable for
79
  display in Streamlit.
80
 
81
+ This function processes the collected guardrail guard calls stored in `self.call_list` and
82
+ organizes them into a dictionary format that can be easily converted into a pandas DataFrame.
83
+ The DataFrame contains columns for the input prompts, the safety status of the outputs, and
84
  the correctness of the predictions for each guardrail.
85
 
86
  The structure of the DataFrame is as follows:
 
88
  - Subsequent columns contain the safety status and prediction correctness for each guardrail.
89
 
90
  Returns:
91
+ pd.DataFrame: A DataFrame containing the input prompts, safety status, and prediction
92
  correctness for each guardrail.
93
  """
94
  dataframe = {