vawsgit
diff --git a/.github/workflows/run_pytest.yaml b/.github/workflows/run_pytest.yaml
Lines changed: 1 addition & 0 deletions
diff --git a/examples/scripts/llm_comparator_demo.py b/examples/scripts/llm_comparator_demo.py
Lines changed: 141 additions & 0 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 7 additions & 2 deletions
@@ -22,6 +22,7 @@ jobs:
         run: |
           python -m pip install --upgrade pip
           pip install -e ".[dev]"
+          pip install -e ".[llm]"
       - name: Test with pytest
         run: |
           coverage run -m pytest  -v -s
 
@@ -0,0 +1,141 @@
+#!/usr/bin/env python3
+"""
+LLM Comparator Demo Script
+
+This script demonstrates the LLMComparator functionality for semantic comparison
+of values using Large Language Models. The LLMComparator leverages AWS Bedrock
+models through the strands-agents library to perform intelligent comparisons
+that go beyond simple string matching.
+
+Requirements:
+- AWS credentials configured for Bedrock access
+- Environment variables for model configuration (optional)
+"""
+from stickler.comparators.llm import LLMComparator
+from stickler.comparators.exact import ExactComparator
+from stickler.comparators.levenshtein import LevenshteinComparator
+from stickler.structured_object_evaluator.models.structured_model import StructuredModel
+from stickler.structured_object_evaluator.models.comparable_field import ComparableField
+
+
+def print_section_header(title: str):
+    """Print *title* framed above and below by a 60-character '=' rule."""
+    rule = "=" * 60
+    print(f"\n{rule}")
+    print(f"🔍 {title}", rule, sep="\n")
+
+
+def demo_structured_model_integration():
+    """Compare two Customer records built on StructuredModel and print the per-field results."""
+    print_section_header("STRUCTURED MODEL INTEGRATION")
+    
+    # Address model: street uses the LLM comparator, city Levenshtein, zip code exact match.
+    class CustomerAddress(StructuredModel):
+        street: str = ComparableField(
+            comparator=LLMComparator(
+                model="us.amazon.nova-lite-v1:0",
+                eval_guidelines="Consider street abbreviations equivalent (St=Street, Ave=Avenue, etc.)"
+            ),
+            threshold=0.8,
+            weight=1.0
+        )
+        city: str = ComparableField(
+            comparator=LevenshteinComparator(),
+            threshold=0.9,
+            weight=1.0
+        )
+        zip_code: str = ComparableField(
+            comparator=ExactComparator(),
+            threshold=1.0,
+            weight=1.0
+        )
+    
+    class Customer(StructuredModel):  # top-level record; nests a CustomerAddress
+        name: str = ComparableField(
+            comparator=ExactComparator(),
+            threshold=0.8,
+            weight=1.0
+        )
+        email: str = ComparableField(
+            comparator=ExactComparator(),
+            threshold=1.0,
+            weight=1.0
+        )
+        address: CustomerAddress = ComparableField(
+            comparator=ExactComparator(),  # NOTE(review): field is a nested StructuredModel — confirm how this comparator applies
+            threshold=1.0,
+            weight=1.0
+        )
+    
+    print("Comparing customer records with mixed comparator types...")
+    
+    # Ground-truth record (street spelled out as "Street")
+    gt_customer = Customer(
+        name="Robert Johnson",
+        email="robert.johnson@email.com",
+        address=CustomerAddress(
+            street="123 Main Street",
+            city="Seattle",
+            zip_code="98101"
+        )
+    )
+    
+    # Predicted record: identical to the ground truth except for the abbreviated street
+    pred_customer = Customer(
+        name="Robert Johnson", 
+        email="robert.johnson@email.com",
+        address=CustomerAddress(
+            street="123 Main St",  # Street abbreviation
+            city="Seattle",
+            zip_code="98101"
+        )
+    )
+    
+    # Compare the prediction against the ground truth, requesting the confusion matrix
+    result = gt_customer.compare_with(pred_customer, include_confusion_matrix=True)
+        
+    # Print the 'overall' entry of every field listed under confusion_matrix['fields']
+    print("\nField-level comparison results:")
+    cm = result['confusion_matrix']
+    for field_name, field_data in cm['fields'].items():
+        field_result = field_data['overall']
+        print(f"   {field_name}: {field_result}")
+
+
+def main():
+    """Run the demo; return 0 on success or 1 if it raised (message on stderr)."""
+    import sys  # local import so the module's import block stays untouched
+
+    print("🚀 LLM COMPARATOR COMPREHENSIVE DEMO")
+    print("=" * 60)
+    print("This demo showcases the LLMComparator functionality for")
+    print("semantic comparison using Large Language Models.")
+
+    # NOTE(review): only the heading is printed; no environment check is run here.
+    print("\n📋 Environment Check:")
+
+    try:
+        demo_structured_model_integration()
+    except Exception as e:  # top-level boundary: report and turn into an exit status
+        print(f"\n❌ Demo failed with error: {e}", file=sys.stderr)
+        print("Please check your AWS credentials and model access.", file=sys.stderr)
+        return 1
+
+    print_section_header("DEMO COMPLETE")
+    print("✅ All demonstrations completed successfully!")
+    print("\n💡 Key Takeaways:")
+    print("   • LLMComparator provides semantic comparison beyond string matching")
+    print("   • Integrates seamlessly with StructuredModel for complex objects")
+
+    print("\n🔧 Best Practices:")
+    print("   • Use specific guidelines for better accuracy")
+    print("   • Choose appropriate models for your use case")
+    print("   • Handle None values and edge cases")
+    print("   • Monitor API costs and latency")
+    print("   • Test with representative data")
+
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())  # builtin `exit` comes from the site module and is absent under `python -S`
@@ -12,10 +12,10 @@ readme = "README.md"
 requires-python = ">=3.12"
 
 dependencies = [
-    "pydantic>=2.11.0",
+    "pydantic>=2.11.0,<3.0.0",
     "rapidfuzz>=3.0.0",
     "munkres>=1.1.4",
-    "numpy>=1.24.0",
+    "numpy>=1.24.0,<=2.3.3",
     "scipy>=1.10.0",
     "psutil>=5.8.0",
     "pandas>=1.5.0",
@@ -30,6 +30,11 @@ dev = [
     "beautifulsoup4>=4.14.2"
 ]
 
+llm = [
+    "strands-agents>=1.0.0,<=1.16.0",
+    "jinja2>=3.0.0,<=3.1.6"
+]
+
 
 [tool.setuptools]
 package-dir = {"" = "src"}