From 79f3b532668346c6162c9b808d69ec8586b96a48 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?= Date: Thu, 13 Mar 2025 15:03:03 +0100 Subject: [PATCH 1/4] [8.x][DOCS] Removes sparse_embedding references from EIS docs. --- .../inference/elastic-infer-service.asciidoc | 25 +++++-------------- 1 file changed, 6 insertions(+), 19 deletions(-) diff --git a/docs/reference/inference/elastic-infer-service.asciidoc b/docs/reference/inference/elastic-infer-service.asciidoc index 94f2f1992db7c..65d89d116a4a7 100644 --- a/docs/reference/inference/elastic-infer-service.asciidoc +++ b/docs/reference/inference/elastic-infer-service.asciidoc @@ -33,8 +33,7 @@ include::inference-shared.asciidoc[tag=task-type] -- Available task types: -* `chat_completion`, -* `sparse_embedding`. +* `chat_completion` -- [NOTE] @@ -49,6 +48,10 @@ include::inference-shared.asciidoc[tag=chat-completion-docs] ==== {api-request-body-title} +`chunking_settings`:: +(Optional, object) +include::inference-shared.asciidoc[tag=chunking-settings] + `max_chunk_size`::: (Optional, integer) include::inference-shared.asciidoc[tag=chunking-settings-max-chunking-size] @@ -93,22 +96,6 @@ include::inference-shared.asciidoc[tag=request-per-minute-example] [[inference-example-elastic]] ==== Elastic {infer-cap} Service example - -The following example shows how to create an {infer} endpoint called `elser-model-eis` to perform a `text_embedding` task type. - -[source,console] ------------------------------------------------------------- -PUT _inference/sparse_embedding/elser-model-eis -{ - "service": "elastic", - "service_settings": { - "model_name": "elser" - } -} - ------------------------------------------------------------- -// TEST[skip:TBD] - The following example shows how to create an {infer} endpoint called `chat-completion-endpoint` to perform a `chat_completion` task type. [source,console] @@ -117,7 +104,7 @@ PUT /_inference/chat_completion/chat-completion-endpoint { "service": "elastic", "service_settings": { - "model_id": "model-1" + "model_id": ".rainbow-sprinkles-elastic" } } ------------------------------------------------------------ From 9ef5db8a57d0eee1eb68fe850dde7e83d0111884 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?= Date: Thu, 13 Mar 2025 15:24:20 +0100 Subject: [PATCH 2/4] Update docs/reference/inference/elastic-infer-service.asciidoc --- docs/reference/inference/elastic-infer-service.asciidoc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/reference/inference/elastic-infer-service.asciidoc b/docs/reference/inference/elastic-infer-service.asciidoc index 65d89d116a4a7..27cc82961d912 100644 --- a/docs/reference/inference/elastic-infer-service.asciidoc +++ b/docs/reference/inference/elastic-infer-service.asciidoc @@ -104,7 +104,7 @@ PUT /_inference/chat_completion/chat-completion-endpoint { "service": "elastic", "service_settings": { - "model_id": ".rainbow-sprinkles-elastic" + "model_id": ".rainbow-sprinkles" } } ------------------------------------------------------------ From 315f0e5bbb16725e15be60c7ddc3a686133efe1e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?= Date: Thu, 13 Mar 2025 15:34:58 +0100 Subject: [PATCH 3/4] Update docs/reference/inference/elastic-infer-service.asciidoc --- docs/reference/inference/elastic-infer-service.asciidoc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/reference/inference/elastic-infer-service.asciidoc b/docs/reference/inference/elastic-infer-service.asciidoc index 27cc82961d912..495fe9c060bdf 100644 --- a/docs/reference/inference/elastic-infer-service.asciidoc +++ b/docs/reference/inference/elastic-infer-service.asciidoc @@ -104,7 +104,7 @@ PUT /_inference/chat_completion/chat-completion-endpoint { "service": "elastic", "service_settings": { - "model_id": ".rainbow-sprinkles" + "model_id": "rainbow-sprinkles" } } ------------------------------------------------------------ From d0a7cc88389360ec85d812ae5de6a21273ac2736 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Istv=C3=A1n=20Zolt=C3=A1n=20Szab=C3=B3?= Date: Mon, 17 Mar 2025 15:15:13 +0100 Subject: [PATCH 4/4] Apply suggestions from code review --- docs/reference/inference/elastic-infer-service.asciidoc | 3 --- 1 file changed, 3 deletions(-) diff --git a/docs/reference/inference/elastic-infer-service.asciidoc b/docs/reference/inference/elastic-infer-service.asciidoc index 495fe9c060bdf..291b82798fffc 100644 --- a/docs/reference/inference/elastic-infer-service.asciidoc +++ b/docs/reference/inference/elastic-infer-service.asciidoc @@ -48,9 +48,6 @@ include::inference-shared.asciidoc[tag=chat-completion-docs] ==== {api-request-body-title} -`chunking_settings`:: -(Optional, object) -include::inference-shared.asciidoc[tag=chunking-settings] `max_chunk_size`::: (Optional, integer)