Fix tests: run NLITransformer tests on CPU and pass the classifier head via the constructor

Dmitryv-2024 · Dmitryv-2024 · commit 5c0720525cc8 · 2024-12-29T23:23:21.000+04:00
diff --git a/autointent/_transformers/_nli_transformer.py b/autointent/_transformers/_nli_transformer.py
@@ -97,6 +97,7 @@ def __init__(
         train_classifier: bool = False,
         batch_size: int = 326,
         max_length: int | None = None,
+        classifier_head: LogisticRegressionCV | None = None,
     ) -> None:
         """
         Initialize the NLITransformer.
@@ -106,14 +107,16 @@ def __init__(
         :param train_classifier: Whether to train a custom classifier, defaults to False.
         :param batch_size: Batch size for processing text pairs, defaults to 326.
         :param max_length (int, optional): Max length for input sequences for the cross encoder.
+        :param classifier_head (LogisticRegressionCV, optional): Fitted classifier, mainly for restoring via load().
         """
         self.cross_encoder = CrossEncoder(model, trust_remote_code=True, device=device, max_length=max_length)  # type: ignore[arg-type]
-        self.train_classifier = train_classifier
+        self.train_classifier = False
         self.batch_size = batch_size
         self.max_length = max_length
-        self._clf = None
+        self._clf = classifier_head
 
-        if train_classifier:
+        if classifier_head is not None or train_classifier:
+            self.train_classifier = True
             self._logits_list: list[npt.NDArray[Any]] = []
             self._hook_handler = self.cross_encoder.model.classifier.register_forward_hook(self._classifier_hook)
 
@@ -188,7 +191,7 @@ def predict(self, pairs: list[list[str]]) -> npt.NDArray[Any]:
         features = self.get_features(pairs)
 
         if self._clf is not None:
-            return self._clf.predict_proba(features)[:, 1]
+            return np.array(self._clf.predict_proba(features)[:, 1])
 
         return features
 
@@ -230,17 +233,6 @@ def save(self, path: str) -> None:
         clf_path = dump_dir / "classifier.joblib"
         joblib.dump(self._clf, clf_path)
 
-    def set_classifier(self, clf: LogisticRegressionCV) -> None:
-        """
-        Set the logistic regression classifier.
-
-        :param clf: LogisticRegressionCV instance.
-        """
-        self._clf = clf
-
-        if clf is None:
-            self.train_classifier = False
-
     @classmethod
     def load(cls, path: str) -> "NLITransformer":
         """
@@ -257,9 +249,5 @@ def load(cls, path: str) -> "NLITransformer":
 
         # Load sentence transformer model
         crossencoder_dir = str(dump_dir / "crossencoder")
-        model = CrossEncoder(crossencoder_dir)
-
-        res = cls(model)
-        res.set_classifier(clf)
 
-        return res
+        return cls(crossencoder_dir, classifier_head=clf)
diff --git a/tests/_transformers/test_nli_transformer.py b/tests/_transformers/test_nli_transformer.py
@@ -14,7 +14,7 @@ def data_handler():
 
 
 def test_nli_transformer_predict_without_trained_head(data_handler):
-    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cuda", train_classifier=True)
+    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cpu", train_classifier=True)
     with pytest.raises(ValueError, match="Classifier is not trained yet"):
         model.predict(data_handler.train_utterances())
 
@@ -49,7 +49,7 @@ def check_ranking(ranked, labels):
 
 
 def test_nli_transformer_predict_with_train_head(data_handler):
-    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cuda", train_classifier=True)
+    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cpu", train_classifier=True)
     texts = data_handler.train_utterances()
     labels = data_handler.train_labels()
     model.fit(texts, labels)
@@ -61,7 +61,7 @@ def test_nli_transformer_predict_with_train_head(data_handler):
 
 
 def test_nli_transformer_predict_default(data_handler):
-    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cuda")
+    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cpu")
     texts = data_handler.train_utterances()
     labels = data_handler.train_labels()
     predicted = model.predict(build_pairs(texts))
@@ -72,7 +72,7 @@ def test_nli_transformer_predict_default(data_handler):
 
 
 def test_nli_transformer_predict_default_with_fit(data_handler):
-    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cuda")
+    model = NLITransformer(model="cross-encoder/ms-marco-MiniLM-L-6-v2", device="cpu")
     texts = data_handler.train_utterances()
     labels = data_handler.train_labels()
     model.fit(texts, labels)