Skip to content

Commit d42eb87

Browse files
authored
Merge branch 'main' into tests/refine_assertion
2 parents 269fe84 + d6e2b57 commit d42eb87

File tree

55 files changed

+715
-143
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

55 files changed

+715
-143
lines changed

.backportrc.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
{
22
"upstream" : "elastic/elasticsearch",
3-
"targetBranchChoices" : [ "main", "9.0", "8.19", "8.18", "8.17", "8.16", "8.15", "8.14", "8.13", "8.12", "8.11", "8.10", "8.9", "8.8", "8.7", "8.6", "8.5", "8.4", "8.3", "8.2", "8.1", "8.0", "7.17", "6.8" ],
3+
"targetBranchChoices" : [ "main", "9.1", "9.0", "8.19", "8.18", "8.17", "8.16", "8.15", "8.14", "8.13", "8.12", "8.11", "8.10", "8.9", "8.8", "8.7", "8.6", "8.5", "8.4", "8.3", "8.2", "8.1", "8.0", "7.17", "6.8" ],
44
"targetPRLabels" : [ "backport" ],
55
"branchLabelMapping" : {
6-
"^v9.1.0$" : "main",
6+
"^v9.2.0$" : "main",
77
"^v(\\d+).(\\d+).\\d+(?:-(?:alpha|beta|rc)\\d+)?$" : "$1.$2"
88
}
99
}

.buildkite/pipelines/intake.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ steps:
6565
timeout_in_minutes: 300
6666
matrix:
6767
setup:
68-
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0"]
68+
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0", "9.2.0"]
6969
agents:
7070
provider: gcp
7171
image: family/elasticsearch-ubuntu-2404

.buildkite/pipelines/periodic-packaging.yml

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -382,6 +382,22 @@ steps:
382382
env:
383383
BWC_VERSION: 9.1.0
384384

385+
- label: "{{matrix.image}} / 9.2.0 / packaging-tests-upgrade"
386+
command: ./.ci/scripts/packaging-test.sh -Dbwc.checkout.align=true destructiveDistroUpgradeTest.v9.2.0
387+
timeout_in_minutes: 300
388+
matrix:
389+
setup:
390+
image:
391+
- rocky-8
392+
- ubuntu-2404
393+
agents:
394+
provider: gcp
395+
image: family/elasticsearch-{{matrix.image}}
396+
machineType: custom-16-32768
397+
buildDirectory: /dev/shm/bk
398+
env:
399+
BWC_VERSION: 9.2.0
400+
385401
- group: packaging-tests-windows
386402
steps:
387403
- label: "{{matrix.image}} / packaging-tests-windows"

.buildkite/pipelines/periodic.yml

Lines changed: 21 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -420,6 +420,25 @@ steps:
420420
- signal_reason: agent_stop
421421
limit: 3
422422

423+
- label: 9.2.0 / bwc
424+
command: .ci/scripts/run-gradle.sh -Dbwc.checkout.align=true v9.2.0#bwcTest
425+
timeout_in_minutes: 300
426+
agents:
427+
provider: gcp
428+
image: family/elasticsearch-ubuntu-2404
429+
machineType: n1-standard-32
430+
buildDirectory: /dev/shm/bk
431+
preemptible: true
432+
env:
433+
BWC_VERSION: 9.2.0
434+
retry:
435+
automatic:
436+
- exit_status: "-1"
437+
limit: 3
438+
signal_reason: none
439+
- signal_reason: agent_stop
440+
limit: 3
441+
423442
- label: concurrent-search-tests
424443
command: .ci/scripts/run-gradle.sh -Dbwc.checkout.align=true -Dtests.jvm.argline=-Des.concurrent_search=true -Des.concurrent_search=true functionalTests
425444
timeout_in_minutes: 420
@@ -487,7 +506,7 @@ steps:
487506
setup:
488507
ES_RUNTIME_JAVA:
489508
- openjdk21
490-
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0"]
509+
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0", "9.2.0"]
491510
agents:
492511
provider: gcp
493512
image: family/elasticsearch-ubuntu-2404
@@ -531,7 +550,7 @@ steps:
531550
ES_RUNTIME_JAVA:
532551
- openjdk21
533552
- openjdk23
534-
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0"]
553+
BWC_VERSION: ["8.17.9", "8.18.4", "8.19.0", "9.0.4", "9.1.0", "9.2.0"]
535554
agents:
536555
provider: gcp
537556
image: family/elasticsearch-ubuntu-2404

.ci/bwcVersions

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,3 +21,4 @@ BWC_VERSION:
2121
- "8.19.0"
2222
- "9.0.4"
2323
- "9.1.0"
24+
- "9.2.0"

.ci/snapshotBwcVersions

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,3 +4,4 @@ BWC_VERSION:
44
- "8.19.0"
55
- "9.0.4"
66
- "9.1.0"
7+
- "9.2.0"

build-tools-internal/version.properties

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
elasticsearch = 9.1.0
1+
elasticsearch = 9.2.0
22
lucene = 10.2.2
33

44
bundled_jdk_vendor = openjdk

docs/changelog/129967.yaml

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
pr: 129967
2+
summary: Support returning default `index_options` for `semantic_text` fields when
3+
`include_defaults` is true
4+
area: Search
5+
type: bug
6+
issues: []

docs/changelog/130027.yaml

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
pr: 130027
2+
summary: "Fix: prevent duplication of \"invalid index name\" string in the final exception\
3+
\ error message"
4+
area: ES|QL
5+
type: bug
6+
issues: []

docs/reference/elasticsearch/mapping-reference/semantic-text.md

Lines changed: 34 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -112,32 +112,11 @@ to create the endpoint. If not specified, the {{infer}} endpoint defined by
112112
`inference_id` will be used at both index and query time.
113113

114114
`index_options`
115-
: (Optional, string) Specifies the index options to override default values
115+
: (Optional, object) Specifies the index options to override default values
116116
for the field. Currently, `dense_vector` index options are supported.
117117
For text embeddings, `index_options` may match any allowed
118118
[dense_vector index options](/reference/elasticsearch/mapping-reference/dense-vector.md#dense-vector-index-options).
119119

120-
An example of how to set index_options for a `semantic_text` field:
121-
122-
```console
123-
PUT my-index-000004
124-
{
125-
"mappings": {
126-
"properties": {
127-
"inference_field": {
128-
"type": "semantic_text",
129-
"inference_id": "my-text-embedding-endpoint",
130-
"index_options": {
131-
"dense_vector": {
132-
"type": "int4_flat"
133-
}
134-
}
135-
}
136-
}
137-
}
138-
}
139-
```
140-
141120
`chunking_settings`
142121
: (Optional, object) Settings for chunking text into smaller passages.
143122
If specified, these will override the chunking settings set in the {{infer-cap}}
@@ -165,7 +144,7 @@ To completely disable chunking, use the `none` chunking strategy.
165144
or `1`. Required for `sentence` type chunking settings
166145

167146
::::{warning}
168-
If the input exceeds the maximum token limit of the underlying model, some
147+
When using the `none` chunking strategy, if the input exceeds the maximum token limit of the underlying model, some
169148
services (such as OpenAI) may return an
170149
error. In contrast, the `elastic` and `elasticsearch` services will
171150
automatically truncate the input to fit within the
@@ -315,18 +294,38 @@ specified. It enables you to quickstart your semantic search by providing
315294
automatic {{infer}} and a dedicated query so you don’t need to provide further
316295
details.
317296

318-
In case you want to customize data indexing, use the [
319-
`sparse_vector`](/reference/elasticsearch/mapping-reference/sparse-vector.md)
320-
or [`dense_vector`](/reference/elasticsearch/mapping-reference/dense-vector.md)
321-
field types and create an ingest pipeline with
322-
an [{{infer}} processor](/reference/enrich-processor/inference-processor.md) to
323-
generate the
324-
embeddings. [This tutorial](docs-content://solutions/search/semantic-search/semantic-search-inference.md)
325-
walks you through the process. In these cases - when you use `sparse_vector` or
326-
`dense_vector` field types instead of the `semantic_text` field type to
327-
customize indexing - using the [
328-
`semantic_query`](/reference/query-languages/query-dsl/query-dsl-semantic-query.md)
329-
is not supported for querying the field data.
297+
If you want to override those defaults and customize the embeddings that
298+
`semantic_text` indexes, you can do so by modifying
299+
[parameters](#semantic-text-params):
300+
301+
- Use `index_options` to specify alternate index options such as specific
302+
`dense_vector` quantization methods
303+
- Use `chunking_settings` to override the chunking strategy associated with the
304+
{{infer}} endpoint, or completely disable chunking using the `none` type
305+
306+
Here is an example of how to set these parameters for a text embedding endpoint:
307+
308+
```console
309+
PUT my-index-000004
310+
{
311+
"mappings": {
312+
"properties": {
313+
"inference_field": {
314+
"type": "semantic_text",
315+
"inference_id": "my-text-embedding-endpoint",
316+
"index_options": {
317+
"dense_vector": {
318+
"type": "int4_flat"
319+
}
320+
},
321+
"chunking_settings": {
322+
"type": "none"
323+
}
324+
}
325+
}
326+
}
327+
}
328+
```
330329

331330
## Updates to `semantic_text` fields [update-script]
332331

0 commit comments

Comments
 (0)