Skip to content

Commit b19c0c1

Browse files
jonathan-buttner and jozala
authored and committed
Lowering the allocations during update to fit within available processors
1 parent 61c3d15 commit b19c0c1

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/CreateFromDeploymentIT.java

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,7 @@ public void testAttachToDeployment() throws IOException {
5151
var results = infer(inferenceId, List.of("washing machine"));
5252
assertNotNull(results.get("sparse_embedding"));
5353

54-
var updatedNumAllocations = randomIntBetween(1, 10);
54+
var updatedNumAllocations = randomIntBetween(1, 2);
5555
var updatedEndpointConfig = updateEndpoint(inferenceId, updatedEndpointConfig(updatedNumAllocations), TaskType.SPARSE_EMBEDDING);
5656
assertThat(
5757
updatedEndpointConfig.get("service_settings"),
@@ -128,7 +128,7 @@ public void testAttachWithModelId() throws IOException {
128128
var results = infer(inferenceId, List.of("washing machine"));
129129
assertNotNull(results.get("sparse_embedding"));
130130

131-
var updatedNumAllocations = randomIntBetween(1, 10);
131+
var updatedNumAllocations = randomIntBetween(1, 2);
132132
var updatedEndpointConfig = updateEndpoint(inferenceId, updatedEndpointConfig(updatedNumAllocations), TaskType.SPARSE_EMBEDDING);
133133
assertThat(
134134
updatedEndpointConfig.get("service_settings"),

0 commit comments

Comments
 (0)