Skip to content

Commit e0963ae

Browse files
committed
Adds examples.
1 parent 61c6a98 commit e0963ae

File tree

5 files changed

+129
-0
lines changed

5 files changed

+129
-0
lines changed
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
summary: Custom text embedding task (OpenAI)
2+
description: Run `PUT _inference/text_embedding/custom-embeddings` to create an inference endpoint that performs a text embedding task.
3+
method_request: 'PUT _inference/text_embedding/custom-embeddings'
4+
# type: "request"
5+
value: |-
6+
{
7+
"service": "custom",
8+
"service_settings": {
9+
"secret_parameters": {
10+
"api_key": "<api key>"
11+
},
12+
"url": "https://api.openai.com/v1/embeddings",
13+
"headers": {
14+
"Authorization": "Bearer ${api_key}",
15+
"Content-Type": "application/json;charset=utf-8"
16+
},
17+
"request": "{\"input\": ${input}, \"model\": \"text-embedding-3-small\"}",
18+
"response": {
19+
"json_parser": {
20+
"text_embeddings": "$.data[*].embedding[*]"
21+
}
22+
}
23+
}
24+
}
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
summary: Custom rerank task (Cohere API v2)
2+
description: Run `PUT _inference/rerank/custom-rerank` to create an inference endpoint that performs a rerank task.
3+
method_request: 'PUT _inference/rerank/custom-rerank'
4+
# type: "request"
5+
value: |-
6+
{
7+
"service": "custom",
8+
"service_settings": {
9+
"secret_parameters": {
10+
"api_key": "<api key>"
11+
},
12+
"url": "https://api.cohere.com/v2/rerank",
13+
"headers": {
14+
"Authorization": "bearer ${api_key}",
15+
"Content-Type": "application/json"
16+
},
17+
"request": "{\"documents\": ${input}, \"query\": ${query}, \"model\": \"rerank-v3.5\"}",
18+
"response": {
19+
"json_parser": {
20+
"reranked_index": "$.results[*].index",
21+
"relevance_score": "$.results[*].relevance_score"
22+
}
23+
}
24+
}
25+
}
Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,31 @@
1+
summary: Custom text embedding task (Cohere API v2)
2+
description: Run `PUT _inference/text_embedding/custom-text-embedding` to create an inference endpoint that performs a text embedding task.
3+
method_request: 'PUT _inference/text_embedding/custom-text-embedding'
4+
# type: "request"
5+
value: |-
6+
{
7+
"service": "custom",
8+
"service_settings": {
9+
"secret_parameters": {
10+
"api_key": "<api key>"
11+
},
12+
"url": "https://api.cohere.com/v2/embed",
13+
"headers": {
14+
"Authorization": "bearer ${api_key}",
15+
"Content-Type": "application/json"
16+
},
17+
"request": "{\"texts\": ${input}, \"model\": \"embed-v4.0\", \"input_type\": ${input_type}}",
18+
"response": {
19+
"json_parser": {
20+
"text_embeddings": "$.embeddings.float[*]"
21+
}
22+
},
23+
"input_type": {
24+
"translation": {
25+
"ingest": "search_document",
26+
"search": "search_query"
27+
},
28+
"default": "search_document"
29+
}
30+
}
31+
}
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
summary: Custom rerank task (Jina AI)
2+
description: Run `PUT _inference/rerank/custom-rerank-jina` to create an inference endpoint that performs a rerank task.
3+
method_request: 'PUT _inference/rerank/custom-rerank-jina'
4+
# type: "request"
5+
value: |-
6+
{
7+
"service": "custom",
8+
"service_settings": {
9+
"secret_parameters": {
10+
"api_key": "<api key>"
11+
},
12+
"url": "https://api.jina.ai/v1/rerank",
13+
"headers": {
14+
"Content-Type": "application/json",
15+
"Authorization": "Bearer ${api_key}"
16+
},
17+
"request": "{\"model\": \"jina-reranker-v2-base-multilingual\",\"query\": ${query},\"documents\":${input}}",
18+
"response": {
19+
"json_parser": {
20+
"relevance_score": "$.results[*].relevance_score",
21+
"reranked_index": "$.results[*].index"
22+
}
23+
}
24+
}
25+
}
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
summary: Custom text embedding task (Hugging Face)
2+
description: Run `PUT _inference/text_embedding/custom-text-embedding-hf` to create an inference endpoint that performs a text embedding task by using the Qwen/Qwen3-Embedding-8B model.
3+
method_request: 'PUT _inference/text_embedding/custom-text-embedding-hf'
4+
# type: "request"
5+
value: |-
6+
{
7+
"service": "custom",
8+
"service_settings": {
9+
"secret_parameters": {
10+
"api_key": "<api key>"
11+
},
12+
"url": "<dedicated inference endpoint on HF>/v1/embeddings",
13+
"headers": {
14+
"Authorization": "Bearer ${api_key}",
15+
"Content-Type": "application/json"
16+
},
17+
"request": "{\"input\": ${input}}",
18+
"response": {
19+
"json_parser": {
20+
"text_embeddings": "$.data[*].embedding[*]"
21+
}
22+
}
23+
}
24+
}

0 commit comments

Comments
 (0)