Skip to content

Commit d1409df

Browse files
committed
Update specification to clarify max chunking settings
1 parent 1e78a79 commit d1409df

File tree

2 files changed

+4
-2
lines changed

2 files changed

+4
-2
lines changed

specification/inference/_types/Services.ts

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -316,7 +316,8 @@ export class InferenceEndpointInfoWatsonx extends InferenceEndpoint {
316 316
export class InferenceChunkingSettings {
317 317
/**
318 318
* The maximum size of a chunk in words.
319-
* This value cannot be higher than `300` or lower than `20` (for `sentence` strategy) or `10` (for `word` strategy).
319+
* This value cannot be lower than `20` (for `sentence` strategy) or `10` (for `word` strategy).
320+
* This value should not exceed the window size for the associated model.
320 321
* @server_default 250
321 322
*/
322 323
max_chunk_size?: integer

specification/inference/put_elser/PutElserRequest.ts

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -78,7 +78,8 @@ export interface Request extends RequestBase {
78 78
}
79 79
body: {
80 80
/**
81-
* The chunking configuration object.
81+
* The chunking configuration object.
82+
* Note that for ELSER endpoints, the max_chunk_size may not exceed `300`.
82 83
* @ext_doc_id inference-chunking
83 84
*/
84 85
chunking_settings?: InferenceChunkingSettings

0 commit comments

Comments
 (0)