Fix typing errors in HashingVectorizer embedding backend

voorhs · voorhs · commit 31fa6e80b11b · 2025-11-19T17:58:49.000+03:00
diff --git a/src/autointent/_wrappers/embedder/hashing_vectorizer.py b/src/autointent/_wrappers/embedder/hashing_vectorizer.py
@@ -67,7 +67,7 @@ def get_hash(self) -> int:
         hasher.update(self.config.norm if self.config.norm is not None else "None")
         hasher.update(self.config.binary)
         hasher.update(self.config.dtype)
-        return hasher.hexdigest()
+        return int(hasher.hexdigest(), 16)
 
     @overload
     def embed(
@@ -97,7 +97,7 @@ def embed(
         """
         # Transform texts to sparse matrix, then convert to dense
         embeddings_sparse = self._vectorizer.transform(utterances)
-        embeddings = embeddings_sparse.toarray().astype(np.float32)
+        embeddings: npt.NDArray[np.float32] = embeddings_sparse.toarray().astype(np.float32)
 
         if return_tensors:
             return torch.from_numpy(embeddings)
@@ -115,7 +115,8 @@ def similarity(
         Returns:
             Similarity matrix with shape (n_samples, m_samples).
         """
-        return cosine_similarity(embeddings1, embeddings2).astype(np.float32)
+        similarity_matrix: npt.NDArray[np.float32] = cosine_similarity(embeddings1, embeddings2).astype(np.float32)
+        return similarity_matrix
 
     def dump(self, path: Path) -> None:
         """Save the backend state to disk.
@@ -157,7 +158,7 @@ def load(cls, path: Path) -> "HashingVectorizerEmbeddingBackend":
         logger.debug("Loaded HashingVectorizer backend from %s", path)
         return instance
 
-    def train(self, utterances: list[str], labels: list[int], config) -> None:  # noqa: ANN001
+    def train(self, utterances: list[str], labels: list[int], config) -> None:  # type: ignore[no-untyped-def]  # noqa: ANN001
         """Train the backend.
 
         HashingVectorizer is stateless and doesn't support training.