update convert script

michaelfeil · michaelfeil · commit 4d153ed3026c · 2025-07-03T21:50:13.000Z
diff --git a/docs/lm_head_to_classifier/convert_lm.py b/docs/lm_head_to_classifier/convert_lm.py
@@ -8,7 +8,7 @@
     AutoTokenizer,
     AutoModelForSequenceClassification,
 )
-
+BASE_NAME = "michaelfeil"
 
 @torch.no_grad()
 def convert_to_sequence_classifier(
@@ -81,14 +81,28 @@ def as_no_id_yes_id(
     assert len(no_id_yes_id[1]) == 1
     return no_id_yes_id[0][0], no_id_yes_id[1][0]
 
+def only_yes_id(
+    model_name: str = "mixedbread-ai/mxbai-rerank-base-v2",
+    yes: str = "1",
+) -> tuple[int]:
+    """Get the id of the yes token."""
+    tokenizer = AutoTokenizer.from_pretrained(model_name)
+    yes_id = tokenizer(yes).input_ids
+    assert len(yes_id) == 1
+    return (yes_id[0],)
+
 
 def upload_and_convert(
     model_name: str = "mixedbread-ai/mxbai-rerank-base-v2",
     no: str = "0",
     yes: str = "1",
+    uses_no_and_yes: bool = True,
 ):
     """Upload the converted sequence classifier to the hub."""
-    no_id_yes_id = as_no_id_yes_id(model_name, yes, no)
+    if not uses_no_and_yes:
+        no_id_yes_id = only_yes_id(model_name, yes)
+    else:
+        no_id_yes_id = as_no_id_yes_id(model_name, yes, no)
     split_name = model_name.split("/")[1]
     model_cls = convert_to_sequence_classifier(f"{model_name}", no_id_yes_id)
     model_cls = model_cls.to(torch.float16)
@@ -99,9 +113,9 @@ def upload_and_convert(
     model_cls.save_pretrained(f"./{split_name}")
 
     api = HfApi()
-    api.create_repo(repo_id=f"michaelfeil/{split_name}-seq", exist_ok=True)
+    api.create_repo(repo_id=f"{BASE_NAME}/{split_name}-seq", exist_ok=True)
     api.upload_folder(
-        repo_id=f"michaelfeil/{split_name}-seq",
+        repo_id=f"{BASE_NAME}/{split_name}-seq",
         folder_path=f"./{split_name}",
     )