Commit 46b86fd

ragas: bump ragas version, pass old rubric in RubricsScore
Before ragas v0.2.11, RubricsScore.rubrics wasn't being applied properly, so this commit sets v0.2.11 as the minimum ragas version for this library. v0.2.11 also changed the prompt used for domain-specific knowledge evaluation with reference; the prompt from previous versions is now explicitly passed in.

Signed-off-by: Ali Maredia <[email protected]>
1 parent: 03afb6c
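
The fix follows a simple pinning pattern: pass an explicit rubrics mapping to RubricsScore rather than relying on the library default, which changed in ragas v0.2.11. Here is a minimal sketch of that pattern, assuming ragas>=0.2.11; the two rubric entries below are illustrative only, while the full five-entry mapping this commit pins appears in the diff further down:

# Minimal sketch of the pinning pattern; assumes ragas>=0.2.11.
# The rubric text here is illustrative only.
from ragas.metrics._domain_specific_rubrics import RubricsScore

pinned_rubrics = {
    "score1_description": "The response is incorrect or irrelevant.",
    "score5_description": "The response is fully accurate and detailed.",
}

# With rubrics passed explicitly, a future change to the library's
# default rubric prompt cannot silently alter scoring behavior.
metric = RubricsScore(rubrics=pinned_rubrics)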

2 files changed: +11 -4 lines

requirements.txt
Lines changed: 1 addition & 1 deletion

@@ -10,4 +10,4 @@ pandas
 pandas-stubs
 lm-eval>=0.4.4
 httpx
-ragas
+ragas>=0.2.11

src/instructlab/eval/ragas.py
Lines changed: 10 additions & 3 deletions

@@ -12,8 +12,8 @@
 from ragas.evaluation import EvaluationDataset, EvaluationResult, RunConfig, evaluate
 from ragas.metrics import Metric
 from ragas.metrics._domain_specific_rubrics import ( # the rubrics we must instantiate are located inside of a file marked as private
-    DEFAULT_WITH_REFERENCE_RUBRICS,
     RubricsScore,
+    SingleTurnPrompt,
 )
 
 # Local

@@ -22,6 +22,14 @@
 
 logger = setup_logger(__name__)
 
+OLD_DEFAULT_WITH_REFERENCE_RUBRICS = {
+    "score1_description": "The response is incorrect, irrelevant, or does not align with the ground truth.",
+    "score2_description": "The response partially matches the ground truth but includes significant errors, omissions, or irrelevant information.",
+    "score3_description": "The response generally aligns with the ground truth but may lack detail, clarity, or have minor inaccuracies.",
+    "score4_description": "The response is mostly accurate and aligns well with the ground truth, with only minor issues or missing details.",
+    "score5_description": "The response is fully accurate, aligns completely with the ground truth, and is clear and detailed.",
+}
+
 
 class Sample(TypedDict):
     """

@@ -256,9 +264,8 @@ def _generate_answers_from_model(
 
     @staticmethod
     def _get_metrics() -> List[Metric]:
-        # default set of metrics
         return [
             RubricsScore(
-                rubrics=DEFAULT_WITH_REFERENCE_RUBRICS,
+                rubrics=OLD_DEFAULT_WITH_REFERENCE_RUBRICS,
             )
         ]
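
A hedged end-to-end sketch of how the pinned metric would be consumed, assuming ragas>=0.2.11, that EvaluationDataset.from_list accepts dicts keyed by user_input/response/reference, and that OLD_DEFAULT_WITH_REFERENCE_RUBRICS is importable from the module patched above; the sample text is made up:

# Score one made-up sample against the pinned rubric.
# evaluate() and EvaluationDataset come from ragas.evaluation, exactly as
# imported in the diff above. A judge LLM is needed: pass llm=..., or ragas
# falls back to its default judge (an assumption about your environment).
from ragas.evaluation import EvaluationDataset, evaluate
from ragas.metrics._domain_specific_rubrics import RubricsScore

from instructlab.eval.ragas import OLD_DEFAULT_WITH_REFERENCE_RUBRICS

metric = RubricsScore(rubrics=OLD_DEFAULT_WITH_REFERENCE_RUBRICS)

dataset = EvaluationDataset.from_list(
    [
        {
            "user_input": "What is the capital of France?",
            "response": "Paris.",
            "reference": "The capital of France is Paris.",
        }
    ]
)

result = evaluate(dataset=dataset, metrics=[metric])
print(result)  # per-sample rubric scores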
