2323from huggingface_hub .file_download import cached_download , filename_to_url , hf_hub_url
2424
2525from .testing_utils import (
26- DUMMY_UNKWOWN_IDENTIFIER ,
26+ DUMMY_MODEL_ID ,
27+ DUMMY_MODEL_ID_PINNED_SHA1 ,
28+ DUMMY_MODEL_ID_PINNED_SHA256 ,
29+ DUMMY_MODEL_ID_REVISION_INVALID ,
30+ DUMMY_MODEL_ID_REVISION_ONE_SPECIFIC_COMMIT ,
2731 SAMPLE_DATASET_IDENTIFIER ,
2832 OfflineSimulationMode ,
2933 offline ,
3034)
3135
3236
33- MODEL_ID = DUMMY_UNKWOWN_IDENTIFIER
34- # An actual model hosted on huggingface.co
37+ REVISION_ID_DEFAULT = "main"
38+ # Default branch name
3539
3640DATASET_ID = SAMPLE_DATASET_IDENTIFIER
3741# An actual dataset hosted on huggingface.co
3842
3943
40- REVISION_ID_DEFAULT = "main"
41- # Default branch name
42- REVISION_ID_ONE_SPECIFIC_COMMIT = "f2c752cfc5c0ab6f4bdec59acea69eefbee381c2"
43- # One particular commit (not the top of `main`)
44- REVISION_ID_INVALID = "aaaaaaa"
45- # This commit does not exist, so we should 404.
46-
47- PINNED_SHA1 = "d9e9f15bc825e4b2c9249e9578f884bbcb5e3684"
48- # Sha-1 of config.json on the top of `main`, for checking purposes
49- PINNED_SHA256 = "4b243c475af8d0a7754e87d7d096c92e5199ec2fe168a2ee7998e3b8e9bcb1d3"
50- # Sha-256 of pytorch_model.bin on the top of `main`, for checking purposes
51-
5244DATASET_REVISION_ID_ONE_SPECIFIC_COMMIT = "e25d55a1c4933f987c46cc75d8ffadd67f257c61"
5345# One particular commit for DATASET_ID
5446DATASET_SAMPLE_PY_FILE = "custom_squad.py"
@@ -62,10 +54,12 @@ def test_bogus_url(self):
6254
6355 def test_no_connection (self ):
6456 invalid_url = hf_hub_url (
65- MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_INVALID
57+ DUMMY_MODEL_ID ,
58+ filename = CONFIG_NAME ,
59+ revision = DUMMY_MODEL_ID_REVISION_INVALID ,
6660 )
6761 valid_url = hf_hub_url (
68- MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_DEFAULT
62+ DUMMY_MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_DEFAULT
6963 )
7064 self .assertIsNotNone (cached_download (valid_url , force_download = True ))
7165 for offline_mode in OfflineSimulationMode :
@@ -78,39 +72,47 @@ def test_no_connection(self):
7872
7973 def test_file_not_found (self ):
8074 # Valid revision (None) but missing file.
81- url = hf_hub_url (MODEL_ID , filename = "missing.bin" )
75+ url = hf_hub_url (DUMMY_MODEL_ID , filename = "missing.bin" )
8276 with self .assertRaisesRegex (requests .exceptions .HTTPError , "404 Client Error" ):
8377 _ = cached_download (url )
8478
8579 def test_revision_not_found (self ):
8680 # Valid file but missing revision
87- url = hf_hub_url (MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_INVALID )
81+ url = hf_hub_url (
82+ DUMMY_MODEL_ID ,
83+ filename = CONFIG_NAME ,
84+ revision = DUMMY_MODEL_ID_REVISION_INVALID ,
85+ )
8886 with self .assertRaisesRegex (requests .exceptions .HTTPError , "404 Client Error" ):
8987 _ = cached_download (url )
9088
9189 def test_standard_object (self ):
92- url = hf_hub_url (MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_DEFAULT )
90+ url = hf_hub_url (
91+ DUMMY_MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_DEFAULT
92+ )
9393 filepath = cached_download (url , force_download = True )
9494 metadata = filename_to_url (filepath )
95- self .assertEqual (metadata , (url , f'"{ PINNED_SHA1 } "' ))
95+ self .assertEqual (metadata , (url , f'"{ DUMMY_MODEL_ID_PINNED_SHA1 } "' ))
9696
9797 def test_standard_object_rev (self ):
9898 # Same object, but different revision
9999 url = hf_hub_url (
100- MODEL_ID , filename = CONFIG_NAME , revision = REVISION_ID_ONE_SPECIFIC_COMMIT
100+ DUMMY_MODEL_ID ,
101+ filename = CONFIG_NAME ,
102+ revision = DUMMY_MODEL_ID_REVISION_ONE_SPECIFIC_COMMIT ,
101103 )
102104 filepath = cached_download (url , force_download = True )
103105 metadata = filename_to_url (filepath )
104- self .assertNotEqual (metadata [1 ], f'"{ PINNED_SHA1 } "' )
106+ self .assertNotEqual (metadata [1 ], f'"{ DUMMY_MODEL_ID_PINNED_SHA1 } "' )
105107 # Caution: check that the etag is *not* equal to the one from `test_standard_object`
106108
107109 def test_lfs_object (self ):
108110 url = hf_hub_url (
109- MODEL_ID , filename = PYTORCH_WEIGHTS_NAME , revision = REVISION_ID_DEFAULT
111+ DUMMY_MODEL_ID , filename = PYTORCH_WEIGHTS_NAME , revision = REVISION_ID_DEFAULT
110112 )
111113 filepath = cached_download (url , force_download = True )
112114 metadata = filename_to_url (filepath )
113- self .assertEqual (metadata , (url , f'"{ PINNED_SHA256 } "' ))
115+ self .assertEqual (metadata , (url , f'"{ DUMMY_MODEL_ID_PINNED_SHA256 } "' ))
114116
115117 def test_dataset_standard_object_rev (self ):
116118 url = hf_hub_url (
@@ -129,7 +131,7 @@ def test_dataset_standard_object_rev(self):
129131 # now let's download
130132 filepath = cached_download (url , force_download = True )
131133 metadata = filename_to_url (filepath )
132- self .assertNotEqual (metadata [1 ], f'"{ PINNED_SHA1 } "' )
134+ self .assertNotEqual (metadata [1 ], f'"{ DUMMY_MODEL_ID_PINNED_SHA1 } "' )
133135
134136 def test_dataset_lfs_object (self ):
135137 url = hf_hub_url (
0 commit comments