Skip to content

Commit 28ac358

Browse files
authored
[fix] Fix setting default rolling batch and extract lora adapter (#2931)
1 parent dd58f95 commit 28ac358

File tree

2 files changed

+1
-2
lines changed

2 files changed

+1
-2
lines changed

engines/python/setup/djl_python/async_utils.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -128,7 +128,7 @@ def _extract_lora_adapter(raw_request, decoded_payload):
128 128   SAGEMAKER_ADAPTER_IDENTIFIER_HEADER)
129 129   logging.debug(f"Found adapter in headers: {adapter_name}")
130 130   elif "adapters" in decoded_payload:
131     - adapter_name = decoded_payload.get("adapters")
    131 + adapter_name = decoded_payload.pop("adapters")
132 132   logging.debug(f"Found adapter in payload: {adapter_name}")
133 133
134 134   return adapter_name

wlm/src/main/java/ai/djl/serving/wlm/LmiConfigRecommender.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -82,7 +82,6 @@ private static void setRollingBatch(
82 82   rollingBatch = "trtllm";
83 83   } else {
84 84   rollingBatch = "disable";
85    - lmiProperties.setProperty("option.async_mode", "true");
86 85   }
87 86   lmiProperties.setProperty("option.rolling_batch", rollingBatch);
88 87   }

0 commit comments

Comments
 (0)