feat / fix: Properly make use of subfolder from HF models (#3072)

younesbelkada · baberabb · web-flow · commit 6b3f3f7e2aec · 2025-06-25T16:02:57.000+05:00
* add subfolder

* lint

* change the `subfolder` default from `None` to an empty string

* fix typehints

---------

Co-authored-by: Baber <baber@hey.com>
diff --git a/lm_eval/models/huggingface.py b/lm_eval/models/huggingface.py
@@ -61,7 +61,7 @@ def __init__(
         backend: Literal["default", "causal", "seq2seq"] = "default",
         # override whether the model should be treated as decoder-only (causal) or encoder-decoder (seq2seq)
         revision: Optional[str] = "main",
-        subfolder: Optional[str] = None,
+        subfolder: str = "",
         tokenizer: Optional[
             Union[
                 str,
@@ -162,14 +162,13 @@ def __init__(
                 )
 
             revision = str(revision)  # cast to string if not already one
-            # TODO: update this to be less of a hack once subfolder is fixed in HF
-            revision = revision + ("/" + subfolder if subfolder is not None else "")
 
             self._get_config(
                 pretrained,
                 revision=revision,
                 trust_remote_code=trust_remote_code,
                 gguf_file=gguf_file,
+                subfolder=subfolder,
             )
 
             # determine which of 'causal' and 'seq2seq' backends to use for HF models
@@ -182,6 +181,7 @@ def __init__(
             pretrained,
             tokenizer,
             revision=revision,
+            subfolder=subfolder,
             trust_remote_code=trust_remote_code,
             use_fast_tokenizer=use_fast_tokenizer,
             gguf_file=gguf_file,
@@ -206,6 +206,7 @@ def __init__(
                 gptqmodel=gptqmodel,
                 gguf_file=gguf_file,
                 quantization_config=getattr(self.config, "quantization_config", None),
+                subfolder=subfolder,
                 **kwargs,
             )
 
@@ -522,13 +523,15 @@ def _get_config(
         revision: str = "main",
         trust_remote_code: bool = False,
         gguf_file: Optional[str] = None,
+        subfolder: str = "",
     ) -> None:
         """Return the model config for HuggingFace models"""
         self._config = transformers.AutoConfig.from_pretrained(
             pretrained,
             revision=revision,
             trust_remote_code=trust_remote_code,
             gguf_file=gguf_file,
+            subfolder=subfolder,
         )
 
     def _create_model(
@@ -552,6 +555,7 @@ def _create_model(
         gptqmodel: Optional[bool] = False,
         gguf_file: Optional[str] = None,
         quantization_config: Optional[Dict[str, Any]] = None,
+        subfolder: str = "",
         **kwargs,
     ) -> None:
         """
@@ -598,6 +602,7 @@ def _create_model(
                 trust_remote_code=trust_remote_code,
                 gguf_file=gguf_file,
                 quantization_config=quantization_config,
+                subfolder=subfolder,
                 **model_kwargs,
             )
         else:
@@ -697,6 +702,7 @@ def _create_tokenizer(
         use_fast_tokenizer: Optional[bool] = True,
         gguf_file: Optional[str] = None,
         add_bos_token: Optional[bool] = False,
+        subfolder: Optional[str] = "",
     ) -> None:
         """
         Helper method during initialization.
@@ -718,6 +724,9 @@ def _create_tokenizer(
         if add_bos_token:
             kwargs["add_bos_token"] = True
 
+        if subfolder:
+            kwargs["subfolder"] = subfolder
+
         if tokenizer:
             if isinstance(tokenizer, str):
                 self.tokenizer = transformers.AutoTokenizer.from_pretrained(