Skip to content

Commit 2ab754c

Browse files
configuring hf downloads to lower memory usage (#895)
* configuring hf downloads to lower memory usage

  Signed-off-by: Brett Thompson <[email protected]>

* update storage initializer container memory limit to 24Gi to provide buffer for model downloads

  Signed-off-by: Brett Thompson <[email protected]>

---------

Signed-off-by: Brett Thompson <[email protected]>
1 parent 803c4c7 commit 2ab754c

File tree

6 files changed

+107
-17
lines changed

6 files changed

+107
-17
lines changed

config/overlays/odh/patches/patch-inferenceservice-config.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ data:
1717
{
1818
"image" : "$(kserve-storage-initializer)",
1919
"memoryRequest": "100Mi",
20-
"memoryLimit": "200Gi",
20+
"memoryLimit": "24Gi",
2121
"cpuRequest": "100m",
2222
"cpuLimit": "1",
2323
"enableDirectPvcVolumeMount": true,

pkg/controller/llmisvc/controller_workload_storage_int_test.go

Lines changed: 0 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -391,10 +391,6 @@ var _ = Describe("LLMInferenceService Controller - Storage configuration", func(
391391
},
392392
},
393393
},
394-
{
395-
Name: hf.HFTransfer,
396-
Value: "1",
397-
},
398394
}
399395
validateStorageInitializerCredentials(expectedMainDeployment, expectedEnvVars)
400396
validateStorageInitializerCredentials(expectedPrefillDeployment, expectedEnvVars)
@@ -1350,10 +1346,6 @@ var _ = Describe("LLMInferenceService Controller - Storage configuration", func(
13501346
},
13511347
},
13521348
},
1353-
{
1354-
Name: hf.HFTransfer,
1355-
Value: "1",
1356-
},
13571349
}
13581350
validateStorageInitializerCredentialsForLWS(expectedMainLWS, expectedEnvVars)
13591351
validateStorageInitializerCredentialsForLWS(expectedPrefillLWS, expectedEnvVars)

pkg/credentials/hf/hf_secret.go

Lines changed: 0 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,6 @@ import (
2222

2323
const (
2424
HFTokenKey = "HF_TOKEN"
25-
HFTransfer = "HF_HUB_ENABLE_HF_TRANSFER"
2625
)
2726

2827
func BuildSecretEnvs(secret *corev1.Secret) []corev1.EnvVar {
@@ -41,10 +40,6 @@ func BuildSecretEnvs(secret *corev1.Secret) []corev1.EnvVar {
4140
},
4241
},
4342
},
44-
{
45-
Name: HFTransfer,
46-
Value: "1",
47-
},
4843
}...)
4944
}
5045
return envs

pkg/credentials/hf/hf_secret_test.go

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -36,12 +36,10 @@ func TestBuildSecretEnvs_WithToken(t *testing.T) {
3636

3737
envs := BuildSecretEnvs(secret)
3838

39-
assert.Len(t, envs, 2)
39+
assert.Len(t, envs, 1)
4040
assert.Equal(t, HFTokenKey, envs[0].Name)
4141
assert.Equal(t, HFTokenKey, envs[0].ValueFrom.SecretKeyRef.Key)
4242
assert.Equal(t, secret.Name, envs[0].ValueFrom.SecretKeyRef.LocalObjectReference.Name)
43-
assert.Equal(t, HFTransfer, envs[1].Name)
44-
assert.Equal(t, "1", envs[1].Value)
4543
}
4644

4745
func TestBuildSecretEnvs_WithoutToken(t *testing.T) {

pkg/utils/storage.go

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -195,6 +195,18 @@ func AddStorageInitializerContainer(podSpec *corev1.PodSpec, mainContainerName,
195195
Name: "HF_HOME",
196196
Value: "/tmp",
197197
},
198+
{
199+
Name: "HF_HUB_ENABLE_HF_TRANSFER",
200+
Value: "1",
201+
},
202+
{
203+
Name: "HF_XET_HIGH_PERFORMANCE",
204+
Value: "1",
205+
},
206+
{
207+
Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS",
208+
Value: "8",
209+
},
198210
},
199211
Resources: corev1.ResourceRequirements{
200212
Limits: map[corev1.ResourceName]resource.Quantity{

pkg/webhook/admission/pod/storage_initializer_injector_test.go

Lines changed: 93 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -187,6 +187,9 @@ func TestStorageInitializerInjector(t *testing.T) {
187187
Resources: resourceRequirement,
188188
Env: []corev1.EnvVar{
189189
{Name: "HF_HOME", Value: "/tmp"},
190+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
191+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
192+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
190193
},
191194
TerminationMessagePolicy: "FallbackToLogsOnError",
192195
VolumeMounts: []corev1.VolumeMount{
@@ -252,6 +255,9 @@ func TestStorageInitializerInjector(t *testing.T) {
252255
TerminationMessagePolicy: "FallbackToLogsOnError",
253256
Env: []corev1.EnvVar{
254257
{Name: "HF_HOME", Value: "/tmp"},
258+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
259+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
260+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
255261
},
256262
VolumeMounts: []corev1.VolumeMount{
257263
{
@@ -316,6 +322,9 @@ func TestStorageInitializerInjector(t *testing.T) {
316322
Resources: resourceRequirement,
317323
Env: []corev1.EnvVar{
318324
{Name: "HF_HOME", Value: "/tmp"},
325+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
326+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
327+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
319328
},
320329
TerminationMessagePolicy: "FallbackToLogsOnError",
321330
VolumeMounts: []corev1.VolumeMount{
@@ -381,6 +390,9 @@ func TestStorageInitializerInjector(t *testing.T) {
381390
Resources: resourceRequirement,
382391
Env: []corev1.EnvVar{
383392
{Name: "HF_HOME", Value: "/tmp"},
393+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
394+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
395+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
384396
},
385397
TerminationMessagePolicy: "FallbackToLogsOnError",
386398
VolumeMounts: []corev1.VolumeMount{
@@ -450,6 +462,9 @@ func TestStorageInitializerInjector(t *testing.T) {
450462
Resources: resourceRequirement,
451463
Env: []corev1.EnvVar{
452464
{Name: "HF_HOME", Value: "/tmp"},
465+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
466+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
467+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
453468
},
454469
TerminationMessagePolicy: "FallbackToLogsOnError",
455470
VolumeMounts: []corev1.VolumeMount{
@@ -531,6 +546,9 @@ func TestStorageInitializerInjector(t *testing.T) {
531546
Args: []string{"s3://my-bucket/foo/bar", constants.DefaultModelLocalMountPath},
532547
Env: []corev1.EnvVar{
533548
{Name: "HF_HOME", Value: "/tmp"},
549+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
550+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
551+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
534552
{
535553
Name: credentials.StorageOverrideConfigEnvKey,
536554
Value: `{"bucket":"my-bucket","type":"s3"}`,
@@ -814,6 +832,9 @@ func TestCredentialInjection(t *testing.T) {
814832
},
815833
Env: []corev1.EnvVar{
816834
{Name: "HF_HOME", Value: "/tmp"},
835+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
836+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
837+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
817838
{
818839
Name: s3.AWSAccessKeyId,
819840
ValueFrom: &corev1.EnvVarSource{
@@ -920,6 +941,9 @@ func TestCredentialInjection(t *testing.T) {
920941
},
921942
Env: []corev1.EnvVar{
922943
{Name: "HF_HOME", Value: "/tmp"},
944+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
945+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
946+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
923947
{
924948
Name: gcs.GCSCredentialEnvKey,
925949
Value: gcs.GCSCredentialVolumeMountPath + "gcloud-application-credentials.json",
@@ -1009,6 +1033,9 @@ func TestCredentialInjection(t *testing.T) {
10091033
Args: []string{"s3://my-bucket/foo/bar", constants.DefaultModelLocalMountPath},
10101034
Env: []corev1.EnvVar{
10111035
{Name: "HF_HOME", Value: "/tmp"},
1036+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1037+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1038+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
10121039
{
10131040
Name: credentials.StorageConfigEnvKey,
10141041
ValueFrom: &corev1.EnvVarSource{
@@ -1105,6 +1132,9 @@ func TestCredentialInjection(t *testing.T) {
11051132
Args: []string{"s3://my-bucket/foo/bar", constants.DefaultModelLocalMountPath},
11061133
Env: []corev1.EnvVar{
11071134
{Name: "HF_HOME", Value: "/tmp"},
1135+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1136+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1137+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
11081138
{
11091139
Name: credentials.StorageConfigEnvKey,
11101140
ValueFrom: &corev1.EnvVarSource{
@@ -1223,6 +1253,9 @@ func TestStorageInitializerConfigmap(t *testing.T) {
12231253
Resources: resourceRequirement,
12241254
Env: []corev1.EnvVar{
12251255
{Name: "HF_HOME", Value: "/tmp"},
1256+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1257+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1258+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
12261259
},
12271260
TerminationMessagePolicy: "FallbackToLogsOnError",
12281261
VolumeMounts: []corev1.VolumeMount{
@@ -1465,6 +1498,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
14651498
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
14661499
Env: []corev1.EnvVar{
14671500
{Name: "HF_HOME", Value: "/tmp"},
1501+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1502+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1503+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
14681504
{
14691505
Name: s3.AWSAccessKeyId,
14701506
ValueFrom: &corev1.EnvVarSource{
@@ -1567,6 +1603,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
15671603
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
15681604
Env: []corev1.EnvVar{
15691605
{Name: "HF_HOME", Value: "/tmp"},
1606+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1607+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1608+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
15701609
{
15711610
Name: s3.AWSAccessKeyId,
15721611
ValueFrom: &corev1.EnvVarSource{
@@ -1688,6 +1727,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
16881727
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
16891728
Env: []corev1.EnvVar{
16901729
{Name: "HF_HOME", Value: "/tmp"},
1730+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1731+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1732+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
16911733
{
16921734
Name: s3.AWSAccessKeyId,
16931735
ValueFrom: &corev1.EnvVarSource{
@@ -1811,6 +1853,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
18111853
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
18121854
Env: []corev1.EnvVar{
18131855
{Name: "HF_HOME", Value: "/tmp"},
1856+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1857+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1858+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
18141859
{
18151860
Name: s3.AWSAccessKeyId,
18161861
ValueFrom: &corev1.EnvVarSource{
@@ -1927,6 +1972,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
19271972
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
19281973
Env: []corev1.EnvVar{
19291974
{Name: "HF_HOME", Value: "/tmp"},
1975+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
1976+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
1977+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
19301978
{
19311979
Name: s3.AWSAccessKeyId,
19321980
ValueFrom: &corev1.EnvVarSource{
@@ -2034,6 +2082,9 @@ func TestCaBundleConfigMapVolumeMountInStorageInitializer(t *testing.T) {
20342082
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
20352083
Env: []corev1.EnvVar{
20362084
{Name: "HF_HOME", Value: "/tmp"},
2085+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
2086+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
2087+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
20372088
{
20382089
Name: s3.AWSAccessKeyId,
20392090
ValueFrom: &corev1.EnvVarSource{
@@ -2428,6 +2479,9 @@ func TestTransformerCollocation(t *testing.T) {
24282479
Resources: resourceRequirement,
24292480
Env: []corev1.EnvVar{
24302481
{Name: "HF_HOME", Value: "/tmp"},
2482+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
2483+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
2484+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
24312485
},
24322486
TerminationMessagePolicy: "FallbackToLogsOnError",
24332487
VolumeMounts: []corev1.VolumeMount{
@@ -2599,6 +2653,9 @@ func TestTransformerCollocation(t *testing.T) {
25992653
Resources: resourceRequirement,
26002654
Env: []corev1.EnvVar{
26012655
{Name: "HF_HOME", Value: "/tmp"},
2656+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
2657+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
2658+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
26022659
},
26032660
TerminationMessagePolicy: "FallbackToLogsOnError",
26042661
VolumeMounts: []corev1.VolumeMount{
@@ -2847,6 +2904,9 @@ func TestStorageContainerCRDInjection(t *testing.T) {
28472904
Env: []corev1.EnvVar{
28482905
{Name: "name", Value: "value"},
28492906
{Name: "HF_HOME", Value: "/tmp"},
2907+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
2908+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
2909+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
28502910
},
28512911
},
28522912
},
@@ -2903,6 +2963,9 @@ func TestStorageContainerCRDInjection(t *testing.T) {
29032963
Resources: resourceRequirement, // from configMap instead of the CR
29042964
Env: []corev1.EnvVar{
29052965
{Name: "HF_HOME", Value: "/tmp"},
2966+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
2967+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
2968+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
29062969
},
29072970
TerminationMessagePolicy: "FallbackToLogsOnError",
29082971
VolumeMounts: []corev1.VolumeMount{
@@ -3339,6 +3402,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
33393402
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
33403403
Env: []corev1.EnvVar{
33413404
{Name: "HF_HOME", Value: "/tmp"},
3405+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3406+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3407+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
33423408
},
33433409
Resources: resourceRequirement,
33443410
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3414,6 +3480,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
34143480
Resources: resourceRequirement,
34153481
Env: []corev1.EnvVar{
34163482
{Name: "HF_HOME", Value: "/tmp"},
3483+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3484+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3485+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
34173486
},
34183487
TerminationMessagePolicy: "FallbackToLogsOnError",
34193488
VolumeMounts: []corev1.VolumeMount{
@@ -3501,6 +3570,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
35013570
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
35023571
Env: []corev1.EnvVar{
35033572
{Name: "HF_HOME", Value: "/tmp"},
3573+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3574+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3575+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
35043576
},
35053577
Resources: resourceRequirement,
35063578
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3566,6 +3638,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
35663638
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
35673639
Env: []corev1.EnvVar{
35683640
{Name: "HF_HOME", Value: "/tmp"},
3641+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3642+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3643+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
35693644
},
35703645
Resources: resourceRequirement,
35713646
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3643,6 +3718,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
36433718
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
36443719
Env: []corev1.EnvVar{
36453720
{Name: "HF_HOME", Value: "/tmp"},
3721+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3722+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3723+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
36463724
},
36473725
Resources: resourceRequirement,
36483726
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3720,6 +3798,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
37203798
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
37213799
Env: []corev1.EnvVar{
37223800
{Name: "HF_HOME", Value: "/tmp"},
3801+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3802+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3803+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
37233804
},
37243805
Resources: resourceRequirement,
37253806
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3797,6 +3878,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
37973878
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
37983879
Env: []corev1.EnvVar{
37993880
{Name: "HF_HOME", Value: "/tmp"},
3881+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3882+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3883+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
38003884
},
38013885
Resources: resourceRequirement,
38023886
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3873,6 +3957,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
38733957
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
38743958
Env: []corev1.EnvVar{
38753959
{Name: "HF_HOME", Value: "/tmp"},
3960+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
3961+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
3962+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
38763963
},
38773964
Resources: resourceRequirement,
38783965
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -3949,6 +4036,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
39494036
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
39504037
Env: []corev1.EnvVar{
39514038
{Name: "HF_HOME", Value: "/tmp"},
4039+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
4040+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
4041+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
39524042
},
39534043
Resources: resourceRequirement,
39544044
TerminationMessagePolicy: "FallbackToLogsOnError",
@@ -4026,6 +4116,9 @@ func TestStorageInitializerUIDForIstioCNI(t *testing.T) {
40264116
Args: []string{"gs://foo", constants.DefaultModelLocalMountPath},
40274117
Env: []corev1.EnvVar{
40284118
{Name: "HF_HOME", Value: "/tmp"},
4119+
{Name: "HF_HUB_ENABLE_HF_TRANSFER", Value: "1"},
4120+
{Name: "HF_XET_HIGH_PERFORMANCE", Value: "1"},
4121+
{Name: "HF_XET_NUM_CONCURRENT_RANGE_GETS", Value: "8"},
40294122
},
40304123
Resources: resourceRequirement,
40314124
TerminationMessagePolicy: "FallbackToLogsOnError",

0 commit comments

Comments
 (0)