
feat(#932): label models now modify the prediction_agent when calling LabelModel.predict (#1049)

* feat: add prediction agent

* test: add asserts

(cherry picked from commit 867f377)
David Fidalgo authored and frascuchon committed Feb 2, 2022
1 parent eb958bf commit 4a024ee
Showing 2 changed files with 12 additions and 0 deletions.
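
In practice, the new argument lets callers stamp the records produced by a label model with their own agent string. A minimal usage sketch, assuming a running Rubrix instance; the rule, dataset name, and agent string below are purely illustrative:

```python
from rubrix.labeling.text_classification import Rule, Snorkel, WeakLabels

# Illustrative rule and dataset name; any existing text classification
# dataset with weak labeling rules would do.
rule = Rule(query="money OR stock*", label="finance")
weak_labels = WeakLabels(rules=[rule], dataset="news_dataset")

label_model = Snorkel(weak_labels)
label_model.fit()

# The string passed here is written to the `prediction_agent` field of the
# returned records (previously the field was left unset).
records = label_model.predict(prediction_agent="snorkel-v1")
```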
src/rubrix/labeling/text_classification/label_models.py (8 additions, 0 deletions)
@@ -73,13 +73,15 @@ def predict(
self,
include_annotated_records: bool = False,
include_abstentions: bool = False,
prediction_agent: str = "LabelModel",
**kwargs,
) -> List[TextClassificationRecord]:
"""Applies the label model.
Args:
include_annotated_records: Whether or not to include annotated records.
include_abstentions: Whether or not to include records in the output, for which the label model abstained.
+ prediction_agent: String used for the ``prediction_agent`` in the returned records.
Returns:
A list of records that include the predictions of the label model.
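
As the hunks above and below show, the base ``predict`` defaults the agent to "LabelModel", while ``Snorkel`` and ``FlyingSquid`` override it with their own names, so callers who pass nothing still get a meaningful value. A sketch of relying on that default, assuming ``label_model`` is the fitted Snorkel instance from the earlier sketch:

```python
# Without an explicit prediction_agent, the model's default from this diff is
# used ("Snorkel" here; "FlyingSquid" or "LabelModel" for the other classes).
default_records = label_model.predict()
print({rec.prediction_agent for rec in default_records if rec.prediction})  # expected: {"Snorkel"}
```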
@@ -282,13 +284,15 @@ def predict(
self,
include_annotated_records: bool = False,
include_abstentions: bool = False,
prediction_agent: str = "Snorkel",
tie_break_policy: Union[TieBreakPolicy, str] = "abstain",
) -> List[TextClassificationRecord]:
"""Returns a list of records that contain the predictions of the label model
Args:
include_annotated_records: Whether or not to include annotated records.
include_abstentions: Whether or not to include records in the output, for which the label model abstained.
+ prediction_agent: String used for the ``prediction_agent`` in the returned records.
tie_break_policy: Policy to break ties. You can choose among three policies:
- `abstain`: Do not provide any prediction
@@ -355,6 +359,7 @@ def predict(
]

records_with_prediction[-1].prediction = pred_for_rec
+ records_with_prediction[-1].prediction_agent = prediction_agent

return records_with_prediction
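
Because the agent is stored on each record right next to the prediction, it is preserved when the records are logged back to the server. A sketch, continuing the illustrative names from the first example:

```python
import rubrix as rb

# Each record returned by predict() now carries the agent string alongside
# its prediction.
assert all(rec.prediction_agent == "snorkel-v1" for rec in records if rec.prediction)

# Logging the records keeps that provenance visible when inspecting the dataset.
rb.log(records, name="news_dataset_snorkel_predictions")
```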

@@ -537,6 +542,7 @@ def predict(
self,
include_annotated_records: bool = False,
include_abstentions: bool = False,
prediction_agent: str = "FlyingSquid",
verbose: bool = True,
tie_break_policy: str = "abstain",
) -> List[TextClassificationRecord]:
@@ -545,6 +551,7 @@
Args:
include_annotated_records: Whether or not to include annotated records.
include_abstentions: Whether or not to include records in the output, for which the label model abstained.
+ prediction_agent: String used for the ``prediction_agent`` in the returned records.
verbose: If True, print out messages of the progress to stderr.
tie_break_policy: Policy to break ties. You can choose among two policies:
@@ -618,6 +625,7 @@ def predict(

records_with_prediction.append(rec.copy(deep=True))
records_with_prediction[-1].prediction = pred_for_rec
+ records_with_prediction[-1].prediction_agent = prediction_agent

return records_with_prediction
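
``FlyingSquid.predict`` gains the same argument with its own default. A sketch, reusing the illustrative ``weak_labels`` from the first example and the ``tie_break_policy`` default visible in the signature above:

```python
from rubrix.labeling.text_classification import FlyingSquid

# Same weak_labels as in the first sketch; FlyingSquid is the other label
# model touched by this commit.
flying_squid = FlyingSquid(weak_labels)
flying_squid.fit()

# Omitting prediction_agent would fall back to the new "FlyingSquid" default;
# an explicit value is handy for versioning the model.
records_fs = flying_squid.predict(
    tie_break_policy="abstain",
    prediction_agent="flyingsquid-2022-02",
)
```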

tests/labeling/text_classification/test_label_models.py (4 additions, 0 deletions)
@@ -259,6 +259,7 @@ def mock_predict(self, L, return_probs, tie_break_policy, *args, **kwargs):
tie_break_policy=policy,
include_annotated_records=include_annotated_records,
include_abstentions=include_abstentions,
prediction_agent="mock_agent",
)
assert len(records) == expected[0]
assert [
@@ -267,6 +268,7 @@ def mock_predict(self, L, return_probs, tie_break_policy, *args, **kwargs):
assert [
rec.prediction[0][1] if rec.prediction else None for rec in records
] == expected[2]
+ assert records[0].prediction_agent == "mock_agent"

@pytest.mark.parametrize("policy,expected", [("abstain", 0.5), ("random", 2.0 / 3)])
def test_score(self, monkeypatch, weak_labels, policy, expected):
@@ -455,12 +457,14 @@ def __call__(cls, L_matrix, verbose):
include_annotated_records=include_annotated_records,
include_abstentions=include_abstentions,
verbose=verbose,
prediction_agent="mock_agent",
)

assert MockPredict.calls_count == 3
assert len(records) == expected["nr_of_records"]
if records:
assert records[0].prediction == expected["prediction"]
+ assert records[0].prediction_agent == "mock_agent"

def test_predict_binary(self, monkeypatch, weak_labels):
class MockPredict:
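
The assertions added in this file check exactly this propagation: whatever string the test passes as ``prediction_agent`` must show up on the returned records. A self-contained illustration of the field itself, using a plain record rather than the repository's fixtures or mocks:

```python
from rubrix import TextClassificationRecord

# prediction_agent is a free-form string identifying what produced the
# prediction; with this commit the label models fill it in during predict().
record = TextClassificationRecord(inputs="the stock market rallied today")
record.prediction = [("finance", 0.9)]
record.prediction_agent = "mock_agent"

assert record.prediction_agent == "mock_agent"
```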
