Skip to content

Commit 2c1cece

Browse files
Some fixes (#248)
1 parent d0319e2 commit 2c1cece

File tree

3 files changed

+12
-6
lines changed

3 files changed

+12
-6
lines changed

charts/model-engine/templates/balloon_cpu_deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -34,7 +34,7 @@ spec:
3434
resources:
3535
limits:
3636
memory: 28Gi
37-
cpu: 8
37+
cpu: 6
3838
command:
3939
- /bin/bash
4040
- -c

clients/python/llmengine/model.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -41,10 +41,10 @@ def create(
4141
quantize: Optional[Quantization] = None,
4242
checkpoint_path: Optional[str] = None,
4343
# General endpoint fields
44-
cpus: int = 32,
45-
memory: str = "192Gi",
44+
cpus: int = 8,
45+
memory: str = "40Gi",
4646
storage: str = "96Gi",
47-
gpus: int = 4,
47+
gpus: int = 1,
4848
min_workers: int = 0,
4949
max_workers: int = 1,
5050
per_worker: int = 10,

model-engine/model_engine_server/infra/services/image_cache_service.py

Lines changed: 8 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -128,7 +128,9 @@ async def execute(self, endpoint_infra_states: Dict[str, Tuple[bool, ModelEndpoi
128128
if state.resource_state.gpus == 0 and (
129129
(
130130
state.image not in images_to_cache_priority["cpu"]
131-
or last_updated_at
131+
or last_updated_at.replace(
132+
tzinfo=images_to_cache_priority["cpu"][state.image].last_updated_at.tzinfo
133+
)
132134
> images_to_cache_priority["cpu"][state.image].last_updated_at
133135
)
134136
and self.docker_repository.image_exists(image_tag, repository_name)
@@ -143,7 +145,11 @@ async def execute(self, endpoint_infra_states: Dict[str, Tuple[bool, ModelEndpoi
143145
if state.resource_state.gpu_type == gpu_type and (
144146
(
145147
state.image not in images_to_cache_priority[key]
146-
or last_updated_at
148+
or last_updated_at.replace(
149+
tzinfo=images_to_cache_priority[key][
150+
state.image
151+
].last_updated_at.tzinfo
152+
)
147153
> images_to_cache_priority[key][state.image].last_updated_at
148154
)
149155
and self.docker_repository.image_exists(image_tag, repository_name)

0 commit comments

Comments
 (0)