Skip to content

Commit fffdf82

Browse files
sijunhe and wj-Mcat authored
Support HUGGINGFACE_HUB_CACHE in HF hub download through os env (#3911)
* support hf hub cache
* merge conflict

Co-authored-by: 骑马小猫 <[email protected]>
1 parent 3008246 commit fffdf82

File tree

4 files changed, with 8 additions and 7 deletions.

paddlenlp/transformers/auto/tokenizer.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@
 from paddlenlp.transformers import *
 from paddlenlp.utils.downloader import (COMMUNITY_MODEL_PREFIX,
 get_path_from_url)
-from paddlenlp.utils.env import MODEL_HOME
+from paddlenlp.utils.env import HF_CACHE_HOME
 from paddlenlp.utils.import_utils import is_fast_tokenizer_available
 from paddlenlp.utils.log import logger

@@ -243,7 +243,7 @@ def from_pretrained(cls,
 if from_hf_hub:
 config_file = hf_hub_download(repo_id=pretrained_model_name_or_path,
 filename=cls.tokenizer_config_file,
-cache_dir=MODEL_HOME,
+cache_dir=HF_CACHE_HOME,
 library_name="PaddleNLP",
 library_version=__version__)
 if os.path.exists(config_file):

paddlenlp/transformers/configuration_utils.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@
 
 from paddlenlp import __version__
 from paddlenlp.transformers.utils import resolve_cache_dir
-from paddlenlp.utils.env import MODEL_HOME
+from paddlenlp.utils.env import HF_CACHE_HOME
 from paddlenlp.utils.log import logger
 
 from ..utils import CONFIG_NAME
@@ -748,7 +748,7 @@ def _get_config_dict(cls, pretrained_model_name_or_path: Union[str,
 resolved_config_file = hf_hub_download(
 repo_id=pretrained_model_name_or_path,
 filename=CONFIG_NAME,
-cache_dir=MODEL_HOME,
+cache_dir=HF_CACHE_HOME,
 library_name="PaddleNLP",
 library_version=__version__)

paddlenlp/transformers/model_utils.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@
 from paddlenlp import __version__
 from paddlenlp.utils.downloader import (COMMUNITY_MODEL_PREFIX, download_check,
 get_path_from_url_with_filelock)
-from paddlenlp.utils.env import LOCK_FILE_HOME, MODEL_HOME
+from paddlenlp.utils.env import HF_CACHE_HOME, LOCK_FILE_HOME, MODEL_HOME
 from paddlenlp.utils.file_lock import FileLock
 from paddlenlp.utils.log import logger

@@ -440,7 +440,7 @@ def from_pretrained(cls,
 resolved_resource_files[file_id] = hf_hub_download(
 repo_id=pretrained_model_name_or_path,
 filename=file_path,
-cache_dir=MODEL_HOME,
+cache_dir=HF_CACHE_HOME,
 library_name="PaddleNLP",
 library_version=__version__)
 else:
@@ -851,7 +851,7 @@ def _resolve_model_file_path(cls: Type[PretrainedModel],
 return hf_hub_download(
 repo_id=pretrained_model_name_or_path,
 filename=cls.resource_files_names['model_state'],
-cache_dir=MODEL_HOME,
+cache_dir=HF_CACHE_HOME,
 library_name="PaddleNLP",
 library_version=__version__)

paddlenlp/utils/env.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,7 @@ def _get_sub_home(directory, parent_home=_get_ppnlp_home()):
 USER_HOME = _get_user_home()
 PPNLP_HOME = _get_ppnlp_home()
 MODEL_HOME = _get_sub_home('models')
+HF_CACHE_HOME = os.environ.get('HUGGINGFACE_HUB_CACHE', MODEL_HOME)
 DATA_HOME = _get_sub_home('datasets')
 LOCK_FILE_HOME = _get_sub_home(".lock")
 DOWNLOAD_SERVER = "http://paddlepaddle.org.cn/paddlehub"

0 commit comments

Comments
 (0)