Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion specification/inference/_types/CommonTypes.ts
Original file line number Diff line number Diff line change
Expand Up @@ -391,7 +391,7 @@ export class AlibabaCloudTaskSettings {
export enum AlibabaCloudTaskType {
completion,
rerank,
space_embedding,
sparse_embedding,
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

😁

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

🧑‍🚀

text_embedding
}

Expand Down
1 change: 1 addition & 0 deletions specification/inference/delete/DeleteRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,7 @@ import { TaskType } from '@inference/_types/TaskType'

/**
* Delete an inference endpoint.
* This API requires the `manage_inference` cluster privilege (the built-in `inference_admin` role grants this privilege).
* @rest_spec_name inference.delete
* @availability stack since=8.11.0 stability=stable visibility=public
* @availability serverless stability=stable visibility=public
Expand Down
1 change: 1 addition & 0 deletions specification/inference/get/GetRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,7 @@ import { TaskType } from '@inference/_types/TaskType'

/**
* Get an inference endpoint.
* This API requires the `monitor_inference` cluster privilege (the built-in `inference_admin` and `inference_user` roles grant this privilege).
* @rest_spec_name inference.get
* @availability stack since=8.11.0 stability=stable visibility=public
* @availability serverless stability=stable visibility=public
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -65,6 +65,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `sparse_embedding` or `text_embedding` task types.
* Not applicable to the `rerank` or `completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -68,6 +68,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -65,6 +65,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `sparse_embedding` or `text_embedding` task types.
* Not applicable to the `rerank`, `completion`, or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
6 changes: 0 additions & 6 deletions specification/inference/put_anthropic/PutAnthropicRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,6 @@ import {
AnthropicTaskSettings,
AnthropicTaskType
} from '@inference/_types/CommonTypes'
import { InferenceChunkingSettings } from '@inference/_types/Services'

/**
* Create an Anthropic inference endpoint.
Expand Down Expand Up @@ -64,11 +63,6 @@ export interface Request extends RequestBase {
timeout?: Duration
}
body: {
/**
* The chunking configuration object.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
/**
* The type of service supported for the specified task type. In this case, `anthropic`.
*/
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -65,6 +65,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank` or `completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_cohere/PutCohereRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -65,6 +65,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank` or `completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,6 @@ import {
ContextualAIServiceType,
ContextualAITaskSettings
} from '@inference/_types/CommonTypes'
import { InferenceChunkingSettings } from '@inference/_types/Services'
import { TaskTypeContextualAI } from '@inference/_types/TaskType'

/**
Expand Down Expand Up @@ -65,11 +64,6 @@ export interface Request extends RequestBase {
timeout?: Duration
}
body: {
/**
* The chunking configuration object.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
/**
* The type of service supported for the specified task type. In this case, `contextualai`.
*/
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_custom/PutCustomRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -96,6 +96,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `sparse_embedding` or `text_embedding` task types.
* Not applicable to the `rerank` or `completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
6 changes: 0 additions & 6 deletions specification/inference/put_deepseek/PutDeepSeekRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,6 @@ import {
DeepSeekServiceSettings,
DeepSeekServiceType
} from '@inference/_types/CommonTypes'
import { InferenceChunkingSettings } from '@inference/_types/Services'
import { TaskTypeDeepSeek } from '@inference/_types/TaskType'

/**
Expand Down Expand Up @@ -62,11 +61,6 @@ export interface Request extends RequestBase {
timeout?: Duration
}
body: {
/**
* The chunking configuration object.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
/**
* The type of service supported for the specified task type. In this case, `deepseek`.
*/
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -80,7 +80,7 @@ export interface Request extends RequestBase {
/**
* The chunking configuration object.
* Applies only to the `sparse_embedding` and `text_embedding` task types.
* Not applicable to the `rerank`, `completion`, or `chat_completion` task types.
* Not applicable to the `rerank` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -64,6 +64,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -65,6 +65,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank`, `completion`, or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -101,6 +101,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank`, `completion`, or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_jinaai/PutJinaAiRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -68,6 +68,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_llama/PutLlamaRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -64,6 +64,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_mistral/PutMistralRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -64,6 +64,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_openai/PutOpenAiRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -66,6 +66,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
2 changes: 2 additions & 0 deletions specification/inference/put_voyageai/PutVoyageAIRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -67,6 +67,8 @@ export interface Request extends RequestBase {
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `rerank` task type.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
Expand Down
8 changes: 8 additions & 0 deletions specification/inference/put_watsonx/PutWatsonxRequest.ts
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@ import {
WatsonxServiceType,
WatsonxTaskType
} from '@inference/_types/CommonTypes'
import { InferenceChunkingSettings } from '@inference/_types/Services'

/**
* Create a Watsonx inference endpoint.
Expand Down Expand Up @@ -63,6 +64,13 @@ export interface Request extends RequestBase {
timeout?: Duration
}
body: {
/**
* The chunking configuration object.
* Applies only to the `text_embedding` task type.
* Not applicable to the `completion` or `chat_completion` task types.
* @ext_doc_id inference-chunking
*/
chunking_settings?: InferenceChunkingSettings
/**
* The type of service supported for the specified task type. In this case, `watsonxai`.
*/
Expand Down