Commit caeaa0b

Fix broken PromptScorer/ClassifierScorer UTs. Pydantic attribute issues are resolved and the UTs now pass.

1 parent b64e0e8 commit caeaa0b

2 files changed: +15 −1 lines changed

judgeval/scorers/prompt_scorer.py

Lines changed: 5 additions & 0 deletions
```diff
@@ -47,6 +47,10 @@ class PromptScorer(CustomScorer, BaseModel):
     score_type: str
     threshold: float = Field(default=0.5)
     using_native_model: bool = Field(default=True)
+
+    # DO NOT SET THESE FIELDS MANUALLY, THEY ARE SET BY THE SCORE_EXAMPLE METHOD
+    response: Optional[dict] = None
+    result: Optional[float] = None
 
     def __init__(
         self,
@@ -295,6 +299,7 @@ def __init__(self, name: str, slug: str, conversation: List[dict], options: Mapp
         BaseModel.__init__(
             self,
             name=name,
+            slug=slug,
             score_type=name,
             conversation=conversation,
             options=options,
```
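For context, the declared-fields change follows how Pydantic handles attribute assignment: setting an attribute that is not a declared field on a `BaseModel` raises an error, which is why `response` and `result` must be declared on the class before `score_example()` can populate them. A minimal, self-contained sketch of that behaviour (plain Pydantic, not the judgeval classes; class names here are illustrative only):

```python
from typing import Optional

from pydantic import BaseModel


class WithoutFields(BaseModel):
    score_type: str


class WithFields(BaseModel):
    score_type: str
    # Declared up front, as in the diff above; set at scoring time, not manually.
    response: Optional[dict] = None
    result: Optional[float] = None


broken = WithoutFields(score_type="demo")
try:
    broken.response = {"score": 1.0}  # not a declared field
except ValueError as exc:
    print(exc)  # e.g. '"WithoutFields" object has no field "response"'

fixed = WithFields(score_type="demo")
fixed.response = {"score": 1.0}  # allowed once the field is declared
fixed.result = 1.0
```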

tests/scorers/test_prompt_scorer.py

Lines changed: 10 additions & 1 deletion
```diff
@@ -1,6 +1,7 @@
 import pytest
+from pydantic import BaseModel, Field
 from unittest.mock import MagicMock, AsyncMock
-from typing import List, Dict
+from typing import List, Dict, Any
 
 from judgeval.data import Example
 from judgeval.scorers.prompt_scorer import PromptScorer, ClassifierScorer
@@ -27,6 +28,9 @@ def mock_model():
 
 # Simple implementation of PromptScorer for testing
 class SampleScorer(PromptScorer):
+
+    model: Any = Field(default=None)
+
     def __init__(self, mock_model, *args, **kwargs):
         super().__init__(*args, **kwargs)
         self.model = mock_model
@@ -105,6 +109,7 @@ def classifier_options(self):
     def test_classifier_init(self, classifier_conversation, classifier_options):
         scorer = ClassifierScorer(
             name="test_classifier",
+            slug="test_classifier_slug",
             conversation=classifier_conversation,
             options=classifier_options
         )
@@ -114,6 +119,7 @@ def test_classifier_init(self, classifier_conversation, classifier_options):
     def test_build_measure_prompt(self, example, classifier_conversation, classifier_options):
         scorer = ClassifierScorer(
             name="test_classifier",
+            slug="test_classifier_slug",
             conversation=classifier_conversation,
             options=classifier_options
         )
@@ -124,6 +130,7 @@ def test_build_measure_prompt(self, example, classifier_conversation, classifier
     def test_process_response(self, classifier_conversation, classifier_options):
         scorer = ClassifierScorer(
             name="test_classifier",
+            slug="test_classifier_slug",
             conversation=classifier_conversation,
             options=classifier_options
         )
@@ -136,6 +143,7 @@ def test_process_response(self, classifier_conversation, classifier_options):
     def test_process_response_invalid_choice(self, classifier_conversation, classifier_options):
         scorer = ClassifierScorer(
             name="test_classifier",
+            slug="test_classifier_slug",
             conversation=classifier_conversation,
             options=classifier_options
         )
@@ -147,6 +155,7 @@ def test_process_response_invalid_choice(self, classifier_conversation, classifi
     def test_success_check(self, classifier_conversation, classifier_options):
         scorer = ClassifierScorer(
             name="test_classifier",
+            slug="test_classifier_slug",
             conversation=classifier_conversation,
             options=classifier_options
         )
```
