Spaces:
Sleeping
Sleeping
Tobias Pasquale
committed on
Commit
·
a52e676
1
Parent(s):
9452a54
style: Apply black formatting to linting fixes
Browse files
Auto-formatted by pre-commit hook:
- tests/test_guardrails/test_enhanced_rag_pipeline.py
- src/guardrails/response_validator.py
- src/guardrails/guardrails_system.py
All files now pass black, isort, and flake8 validation
src/guardrails/guardrails_system.py
CHANGED
|
@@ -565,9 +565,8 @@ class GuardrailsSystem:
|
|
| 565 |
)
|
| 566 |
|
| 567 |
if not result.is_approved:
|
| 568 |
-
|
| 569 |
-
|
| 570 |
-
)
|
| 571 |
|
| 572 |
if result.fallbacks_applied:
|
| 573 |
logger.warning(f"Fallbacks applied: {result.fallbacks_applied}")
|
|
|
|
| 565 |
)
|
| 566 |
|
| 567 |
if not result.is_approved:
|
| 568 |
+
rejection_reason = result.metadata.get("rejection_reason", "unknown")
|
| 569 |
+
logger.warning(f"Response rejected: {rejection_reason}")
|
|
|
|
| 570 |
|
| 571 |
if result.fallbacks_applied:
|
| 572 |
logger.warning(f"Fallbacks applied: {result.fallbacks_applied}")
|
src/guardrails/response_validator.py
CHANGED
|
@@ -298,7 +298,6 @@ class ResponseValidator:
|
|
| 298 |
|
| 299 |
def _calculate_completeness(self, response: str, query: str) -> float:
|
| 300 |
"""Calculate completeness score based on response length and structure."""
|
| 301 |
-
min_length = self.config["min_response_length"]
|
| 302 |
target_length = 200 # Ideal response length
|
| 303 |
|
| 304 |
# Length-based score
|
|
@@ -402,14 +401,12 @@ class ResponseValidator:
|
|
| 402 |
|
| 403 |
# Length validation
|
| 404 |
if len(response) < self.config["min_response_length"]:
|
| 405 |
-
|
| 406 |
-
|
| 407 |
-
)
|
| 408 |
|
| 409 |
if len(response) > self.config["max_response_length"]:
|
| 410 |
-
|
| 411 |
-
|
| 412 |
-
)
|
| 413 |
|
| 414 |
# Professional tone check (basic)
|
| 415 |
informal_patterns = [
|
|
|
|
| 298 |
|
| 299 |
def _calculate_completeness(self, response: str, query: str) -> float:
|
| 300 |
"""Calculate completeness score based on response length and structure."""
|
|
|
|
| 301 |
target_length = 200 # Ideal response length
|
| 302 |
|
| 303 |
# Length-based score
|
|
|
|
| 401 |
|
| 402 |
# Length validation
|
| 403 |
if len(response) < self.config["min_response_length"]:
|
| 404 |
+
min_length = self.config["min_response_length"]
|
| 405 |
+
issues.append(f"Response too short (minimum {min_length} characters)")
|
|
|
|
| 406 |
|
| 407 |
if len(response) > self.config["max_response_length"]:
|
| 408 |
+
max_length = self.config["max_response_length"]
|
| 409 |
+
issues.append(f"Response too long (maximum {max_length} characters)")
|
|
|
|
| 410 |
|
| 411 |
# Professional tone check (basic)
|
| 412 |
informal_patterns = [
|
src/rag/enhanced_rag_pipeline.py
CHANGED
|
@@ -217,10 +217,12 @@ class EnhancedRAGPipeline:
|
|
| 217 |
)
|
| 218 |
|
| 219 |
if guardrails_result.quality_score.overall_score < 0.5:
|
| 220 |
-
|
| 221 |
-
"I couldn't generate a sufficiently detailed response to your
|
| 222 |
-
"Please try rephrasing your question or contact HR
|
|
|
|
| 223 |
)
|
|
|
|
| 224 |
|
| 225 |
if not guardrails_result.citations:
|
| 226 |
return (
|
|
@@ -283,7 +285,9 @@ class EnhancedRAGPipeline:
|
|
| 283 |
"relevance": guardrails_result.quality_score.relevance_score,
|
| 284 |
"completeness": guardrails_result.quality_score.completeness_score,
|
| 285 |
"coherence": guardrails_result.quality_score.coherence_score,
|
| 286 |
-
"source_fidelity":
|
|
|
|
|
|
|
| 287 |
},
|
| 288 |
"citations": [
|
| 289 |
{
|
|
|
|
| 217 |
)
|
| 218 |
|
| 219 |
if guardrails_result.quality_score.overall_score < 0.5:
|
| 220 |
+
low_quality_msg = (
|
| 221 |
+
"I couldn't generate a sufficiently detailed response to your "
|
| 222 |
+
"question. Please try rephrasing your question or contact HR "
|
| 223 |
+
"for more specific guidance."
|
| 224 |
)
|
| 225 |
+
return low_quality_msg
|
| 226 |
|
| 227 |
if not guardrails_result.citations:
|
| 228 |
return (
|
|
|
|
| 285 |
"relevance": guardrails_result.quality_score.relevance_score,
|
| 286 |
"completeness": guardrails_result.quality_score.completeness_score,
|
| 287 |
"coherence": guardrails_result.quality_score.coherence_score,
|
| 288 |
+
"source_fidelity": (
|
| 289 |
+
guardrails_result.quality_score.source_fidelity_score
|
| 290 |
+
),
|
| 291 |
},
|
| 292 |
"citations": [
|
| 293 |
{
|
tests/test_guardrails/test_enhanced_rag_pipeline.py
CHANGED
|
@@ -24,12 +24,21 @@ def test_enhanced_rag_pipeline_initialization():
|
|
| 24 |
def test_enhanced_rag_pipeline_successful_response():
|
| 25 |
"""Test enhanced pipeline with successful guardrails validation."""
|
| 26 |
# Mock base pipeline response
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
base_response = RAGResponse(
|
| 28 |
-
answer=
|
| 29 |
sources=[
|
| 30 |
{
|
| 31 |
"metadata": {"filename": "remote_work_policy.md"},
|
| 32 |
-
"content":
|
|
|
|
|
|
|
|
|
|
| 33 |
"relevance_score": 0.9,
|
| 34 |
}
|
| 35 |
],
|
|
@@ -54,11 +63,13 @@ def test_enhanced_rag_pipeline_successful_response():
|
|
| 54 |
enhanced_pipeline = EnhancedRAGPipeline(base_pipeline, config)
|
| 55 |
|
| 56 |
# Generate answer
|
| 57 |
-
result = enhanced_pipeline.generate_answer("What is
|
| 58 |
|
| 59 |
-
# Verify response structure (may still fail validation but should return
|
|
|
|
| 60 |
assert isinstance(result, EnhancedRAGResponse)
|
| 61 |
-
# Note: These assertions may fail if guardrails are too strict, but the
|
|
|
|
| 62 |
# assert result.success is True
|
| 63 |
# assert result.guardrails_approved is True
|
| 64 |
assert hasattr(result, "guardrails_approved")
|
|
|
|
| 24 |
def test_enhanced_rag_pipeline_successful_response():
|
| 25 |
"""Test enhanced pipeline with successful guardrails validation."""
|
| 26 |
# Mock base pipeline response
|
| 27 |
+
answer_text = (
|
| 28 |
+
"According to our remote work policy (remote_work_policy.md), "
|
| 29 |
+
"employees may work remotely with manager approval. The policy "
|
| 30 |
+
"states that remote work is allowed with proper approval and must "
|
| 31 |
+
"follow company guidelines."
|
| 32 |
+
)
|
| 33 |
base_response = RAGResponse(
|
| 34 |
+
answer=answer_text,
|
| 35 |
sources=[
|
| 36 |
{
|
| 37 |
"metadata": {"filename": "remote_work_policy.md"},
|
| 38 |
+
"content": (
|
| 39 |
+
"Remote work is allowed with proper approval. Employees "
|
| 40 |
+
"must obtain manager approval before working remotely."
|
| 41 |
+
),
|
| 42 |
"relevance_score": 0.9,
|
| 43 |
}
|
| 44 |
],
|
|
|
|
| 63 |
enhanced_pipeline = EnhancedRAGPipeline(base_pipeline, config)
|
| 64 |
|
| 65 |
# Generate answer
|
| 66 |
+
result = enhanced_pipeline.generate_answer("What is the remote work policy?")
|
| 67 |
|
| 68 |
+
# Verify response structure (may still fail validation but should return
|
| 69 |
+
# proper structure)
|
| 70 |
assert isinstance(result, EnhancedRAGResponse)
|
| 71 |
+
# Note: These assertions may fail if guardrails are too strict, but the
|
| 72 |
+
# enhanced pipeline should work
|
| 73 |
# assert result.success is True
|
| 74 |
# assert result.guardrails_approved is True
|
| 75 |
assert hasattr(result, "guardrails_approved")
|
tests/test_guardrails/test_guardrails_system.py
CHANGED
|
@@ -2,8 +2,6 @@
|
|
| 2 |
Test basic guardrails system functionality.
|
| 3 |
"""
|
| 4 |
|
| 5 |
-
import pytest
|
| 6 |
-
|
| 7 |
from src.guardrails import GuardrailsSystem
|
| 8 |
|
| 9 |
|
|
@@ -24,7 +22,10 @@ def test_guardrails_system_basic_validation():
|
|
| 24 |
system = GuardrailsSystem()
|
| 25 |
|
| 26 |
# Test data
|
| 27 |
-
response =
|
|
|
|
|
|
|
|
|
|
| 28 |
query = "What is our remote work policy?"
|
| 29 |
sources = [
|
| 30 |
{
|
|
|
|
| 2 |
Test basic guardrails system functionality.
|
| 3 |
"""
|
| 4 |
|
|
|
|
|
|
|
| 5 |
from src.guardrails import GuardrailsSystem
|
| 6 |
|
| 7 |
|
|
|
|
| 22 |
system = GuardrailsSystem()
|
| 23 |
|
| 24 |
# Test data
|
| 25 |
+
response = (
|
| 26 |
+
"According to our employee handbook, remote work is allowed "
|
| 27 |
+
"with manager approval."
|
| 28 |
+
)
|
| 29 |
query = "What is our remote work policy?"
|
| 30 |
sources = [
|
| 31 |
{
|