Skip to content

Commit 797cf9d

Browse files
authored
[Inference API] Rename Elastic Inference Service rerank model/endpoint (#137030)
1 parent c08a605 commit 797cf9d

File tree

5 files changed

+23
-22
lines changed

5 files changed

+23
-22
lines changed

x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/InferenceGetModelsWithElasticInferenceServiceIT.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@ public void testGetDefaultEndpoints() throws IOException {
5252
assertInferenceIdTaskType(allModels, ".rainbow-sprinkles-elastic", TaskType.CHAT_COMPLETION);
5353
assertInferenceIdTaskType(allModels, ".elser-2-elastic", TaskType.SPARSE_EMBEDDING);
5454
assertInferenceIdTaskType(allModels, ".jina-embeddings-v3", TaskType.TEXT_EMBEDDING);
55-
assertInferenceIdTaskType(allModels, ".rerank-v1-elastic", TaskType.RERANK);
55+
assertInferenceIdTaskType(allModels, ".elastic-rerank-v1", TaskType.RERANK);
5656
}
5757

5858
private static void assertInferenceIdTaskType(List<Map<String, Object>> models, String inferenceId, TaskType taskType) {

x-pack/plugin/inference/qa/inference-service-tests/src/javaRestTest/java/org/elasticsearch/xpack/inference/MockElasticInferenceServiceAuthorizationServer.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -47,7 +47,7 @@ public void enqueueAuthorizeAllModelsResponse() {
4747
"task_types": ["embed/text/dense"]
4848
},
4949
{
50-
"model_name": "rerank-v1",
50+
"model_name": "elastic-rerank-v1",
5151
"task_types": ["rerank/text/text-similarity"]
5252
}
5353
]

x-pack/plugin/inference/src/internalClusterTest/java/org/elasticsearch/xpack/inference/integration/InferenceRevokeDefaultEndpointsIT.java

Lines changed: 9 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -207,7 +207,7 @@ public void testRemoves_DefaultChatCompletion_V1_WhenAuthorizationDoesNotReturnA
207207
"task_types": ["embed/text/dense"]
208208
},
209209
{
210-
"model_name": "rerank-v1",
210+
"model_name": "elastic-rerank-v1",
211211
"task_types": ["rerank/text/text-similarity"]
212212
}
213213
]
@@ -244,7 +244,7 @@ public void testRemoves_DefaultChatCompletion_V1_WhenAuthorizationDoesNotReturnA
244244
service
245245
),
246246
new InferenceService.DefaultConfigId(
247-
".rerank-v1-elastic",
247+
".elastic-rerank-v1",
248248
MinimalServiceSettings.rerank(ElasticInferenceService.NAME),
249249
service
250250
)
@@ -257,10 +257,11 @@ public void testRemoves_DefaultChatCompletion_V1_WhenAuthorizationDoesNotReturnA
257257

258258
PlainActionFuture<List<Model>> listener = new PlainActionFuture<>();
259259
service.defaultConfigs(listener);
260-
assertThat(listener.actionGet(TIMEOUT).get(0).getConfigurations().getInferenceEntityId(), is(".elser-2-elastic"));
261-
assertThat(listener.actionGet(TIMEOUT).get(1).getConfigurations().getInferenceEntityId(), is(".jina-embeddings-v3"));
262-
assertThat(listener.actionGet(TIMEOUT).get(2).getConfigurations().getInferenceEntityId(), is(".rainbow-sprinkles-elastic"));
263-
assertThat(listener.actionGet(TIMEOUT).get(3).getConfigurations().getInferenceEntityId(), is(".rerank-v1-elastic"));
260+
261+
assertThat(listener.actionGet(TIMEOUT).get(0).getConfigurations().getInferenceEntityId(), is(".elastic-rerank-v1"));
262+
assertThat(listener.actionGet(TIMEOUT).get(1).getConfigurations().getInferenceEntityId(), is(".elser-2-elastic"));
263+
assertThat(listener.actionGet(TIMEOUT).get(2).getConfigurations().getInferenceEntityId(), is(".jina-embeddings-v3"));
264+
assertThat(listener.actionGet(TIMEOUT).get(3).getConfigurations().getInferenceEntityId(), is(".rainbow-sprinkles-elastic"));
264265

265266
var getModelListener = new PlainActionFuture<UnparsedModel>();
266267
// persists the default endpoints
@@ -280,7 +281,7 @@ public void testRemoves_DefaultChatCompletion_V1_WhenAuthorizationDoesNotReturnA
280281
"task_types": ["embed/text/sparse"]
281282
},
282283
{
283-
"model_name": "rerank-v1",
284+
"model_name": "elastic-rerank-v1",
284285
"task_types": ["rerank/text/text-similarity"]
285286
},
286287
{
@@ -316,7 +317,7 @@ public void testRemoves_DefaultChatCompletion_V1_WhenAuthorizationDoesNotReturnA
316317
service
317318
),
318319
new InferenceService.DefaultConfigId(
319-
".rerank-v1-elastic",
320+
".elastic-rerank-v1",
320321
MinimalServiceSettings.rerank(ElasticInferenceService.NAME),
321322
service
322323
)

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceService.java

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -121,8 +121,8 @@ public class ElasticInferenceService extends SenderService {
121121
static final String DEFAULT_MULTILINGUAL_EMBED_ENDPOINT_ID = ".jina-embeddings-v3";
122122

123123
// rerank-v1
124-
static final String DEFAULT_RERANK_MODEL_ID_V1 = "rerank-v1";
125-
static final String DEFAULT_RERANK_ENDPOINT_ID_V1 = defaultEndpointId(DEFAULT_RERANK_MODEL_ID_V1);
124+
static final String DEFAULT_RERANK_MODEL_ID_V1 = "elastic-rerank-v1";
125+
static final String DEFAULT_RERANK_ENDPOINT_ID_V1 = ".elastic-rerank-v1";
126126

127127
/**
128128
* The task types that the {@link InferenceAction.Request} can accept.

x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/elastic/ElasticInferenceServiceTests.java

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1242,7 +1242,7 @@ public void testDefaultConfigs_Returns_DefaultEndpoints_WhenTaskTypeIsCorrect()
12421242
"task_types": ["embed/text/dense"]
12431243
},
12441244
{
1245-
"model_name": "rerank-v1",
1245+
"model_name": "elastic-rerank-v1",
12461246
"task_types": ["rerank/text/text-similarity"]
12471247
}
12481248
]
@@ -1260,6 +1260,11 @@ public void testDefaultConfigs_Returns_DefaultEndpoints_WhenTaskTypeIsCorrect()
12601260
service.defaultConfigIds(),
12611261
is(
12621262
List.of(
1263+
new InferenceService.DefaultConfigId(
1264+
".elastic-rerank-v1",
1265+
MinimalServiceSettings.rerank(ElasticInferenceService.NAME),
1266+
service
1267+
),
12631268
new InferenceService.DefaultConfigId(
12641269
".elser-2-elastic",
12651270
MinimalServiceSettings.sparseEmbedding(ElasticInferenceService.NAME),
@@ -1279,11 +1284,6 @@ public void testDefaultConfigs_Returns_DefaultEndpoints_WhenTaskTypeIsCorrect()
12791284
".rainbow-sprinkles-elastic",
12801285
MinimalServiceSettings.chatCompletion(ElasticInferenceService.NAME),
12811286
service
1282-
),
1283-
new InferenceService.DefaultConfigId(
1284-
".rerank-v1-elastic",
1285-
MinimalServiceSettings.rerank(ElasticInferenceService.NAME),
1286-
service
12871287
)
12881288
)
12891289
)
@@ -1297,10 +1297,10 @@ public void testDefaultConfigs_Returns_DefaultEndpoints_WhenTaskTypeIsCorrect()
12971297
service.defaultConfigs(listener);
12981298
var models = listener.actionGet(TIMEOUT);
12991299
assertThat(models.size(), is(4));
1300-
assertThat(models.get(0).getConfigurations().getInferenceEntityId(), is(".elser-2-elastic"));
1301-
assertThat(models.get(1).getConfigurations().getInferenceEntityId(), is(".jina-embeddings-v3"));
1302-
assertThat(models.get(2).getConfigurations().getInferenceEntityId(), is(".rainbow-sprinkles-elastic"));
1303-
assertThat(models.get(3).getConfigurations().getInferenceEntityId(), is(".rerank-v1-elastic"));
1300+
assertThat(models.get(0).getConfigurations().getInferenceEntityId(), is(".elastic-rerank-v1"));
1301+
assertThat(models.get(1).getConfigurations().getInferenceEntityId(), is(".elser-2-elastic"));
1302+
assertThat(models.get(2).getConfigurations().getInferenceEntityId(), is(".jina-embeddings-v3"));
1303+
assertThat(models.get(3).getConfigurations().getInferenceEntityId(), is(".rainbow-sprinkles-elastic"));
13041304
}
13051305
}
13061306

0 commit comments

Comments
 (0)