Skip to content

Commit 518ccd9

Browse files
kosabogi, leemthompo, and davidkyle
authored
Fixes descriptions in the Inference APIs (#5566)
* Improves descriptions in the Inference APIs
* Update specification/inference/delete/DeleteRequest.ts
  Co-authored-by: Liam Thompson <[email protected]>
* Update specification/inference/put/PutRequest.ts
  Co-authored-by: David Kyle <[email protected]>
* Fixes chunking_settings object descriptions
* Fixes oxford comma
* Formatting fix

---------

Co-authored-by: Liam Thompson <[email protected]>
Co-authored-by: David Kyle <[email protected]>
1 parent cbedec9 commit 518ccd9

File tree

23 files changed

+42
-20
lines changed

23 files changed

+42
-20
lines changed

specification/inference/_types/CommonTypes.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -391,7 +391,7 @@ export class AlibabaCloudTaskSettings {
391391
export enum AlibabaCloudTaskType {
392392
completion,
393393
rerank,
394-
space_embedding,
394+
sparse_embedding,
395395
text_embedding
396396
}
397397

specification/inference/delete/DeleteRequest.ts

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@ import { TaskType } from '@inference/_types/TaskType'
2323

2424
/**
2525
* Delete an inference endpoint
26+
* This API requires the `manage_inference` cluster privilege (the built-in `inference_admin` role grants this privilege).
2627
* @rest_spec_name inference.delete
2728
* @availability stack since=8.11.0 stability=stable visibility=public
2829
* @availability serverless stability=stable visibility=public

specification/inference/get/GetRequest.ts

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@ import { TaskType } from '@inference/_types/TaskType'
2323

2424
/**
2525
* Get an inference endpoint
26+
* This API requires the `monitor_inference` cluster privilege (the built-in `inference_admin` and `inference_user` roles grant this privilege).
2627
* @rest_spec_name inference.get
2728
* @availability stack since=8.11.0 stability=stable visibility=public
2829
* @availability serverless stability=stable visibility=public

specification/inference/put_alibabacloud/PutAlibabaCloudRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,8 @@ export interface Request extends RequestBase {
6565
body: {
6666
/**
6767
* The chunking configuration object.
68+
* Applies only to the `sparse_embedding` or `text_embedding` task types.
69+
* Not applicable to the `rerank` or `completion` task types.
6870
* @ext_doc_id inference-chunking
6971
*/
7072
chunking_settings?: InferenceChunkingSettings

specification/inference/put_amazonbedrock/PutAmazonBedrockRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -68,6 +68,8 @@ export interface Request extends RequestBase {
6868
body: {
6969
/**
7070
* The chunking configuration object.
71+
* Applies only to the `text_embedding` task type.
72+
* Not applicable to the `completion` task type.
7173
* @ext_doc_id inference-chunking
7274
*/
7375
chunking_settings?: InferenceChunkingSettings

specification/inference/put_amazonsagemaker/PutAmazonSageMakerRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,8 @@ export interface Request extends RequestBase {
6565
body: {
6666
/**
6767
* The chunking configuration object.
68+
* Applies only to the `sparse_embedding` or `text_embedding` task types.
69+
* Not applicable to the `rerank`, `completion`, or `chat_completion` task types.
6870
* @ext_doc_id inference-chunking
6971
*/
7072
chunking_settings?: InferenceChunkingSettings

specification/inference/put_anthropic/PutAnthropicRequest.ts

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,6 @@ import {
2626
AnthropicTaskSettings,
2727
AnthropicTaskType
2828
} from '@inference/_types/CommonTypes'
29-
import { InferenceChunkingSettings } from '@inference/_types/Services'
3029

3130
/**
3231
* Create an Anthropic inference endpoint.
@@ -64,11 +63,6 @@ export interface Request extends RequestBase {
6463
timeout?: Duration
6564
}
6665
body: {
67-
/**
68-
* The chunking configuration object.
69-
* @ext_doc_id inference-chunking
70-
*/
71-
chunking_settings?: InferenceChunkingSettings
7266
/**
7367
* The type of service supported for the specified task type. In this case, `anthropic`.
7468
*/

specification/inference/put_azureaistudio/PutAzureAiStudioRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,8 @@ export interface Request extends RequestBase {
6565
body: {
6666
/**
6767
* The chunking configuration object.
68+
* Applies only to the `text_embedding` task type.
69+
* Not applicable to the `rerank` or `completion` task types.
6870
* @ext_doc_id inference-chunking
6971
*/
7072
chunking_settings?: InferenceChunkingSettings

specification/inference/put_azureopenai/PutAzureOpenAiRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -73,6 +73,8 @@ export interface Request extends RequestBase {
7373
body: {
7474
/**
7575
* The chunking configuration object.
76+
* Applies only to the `text_embedding` task type.
77+
* Not applicable to the `completion` task type.
7678
* @ext_doc_id inference-chunking
7779
*/
7880
chunking_settings?: InferenceChunkingSettings

specification/inference/put_cohere/PutCohereRequest.ts

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,8 @@ export interface Request extends RequestBase {
6565
body: {
6666
/**
6767
* The chunking configuration object.
68+
* Applies only to the `text_embedding` task type.
69+
* Not applicable to the `rerank` or `completion` task types.
6870
* @ext_doc_id inference-chunking
6971
*/
7072
chunking_settings?: InferenceChunkingSettings

0 commit comments

Comments
 (0)