diff --git a/src/components/ModelCatalog.tsx b/src/components/ModelCatalog.tsx
index e1b1837eb87e4b..31164f0330054c 100644
--- a/src/components/ModelCatalog.tsx
+++ b/src/components/ModelCatalog.tsx
@@ -80,6 +80,10 @@ const ModelCatalog = ({ models }: { models: WorkersAIModelsSchema[] }) => {
return "Function calling";
}
+ if (property_id === "async_queue" && value === "true") {
+ return "Batch";
+ }
+
return [];
})
.filter((p) => Boolean(p)),
@@ -102,6 +106,10 @@ const ModelCatalog = ({ models }: { models: WorkersAIModelsSchema[] }) => {
return "Function calling";
}
+ if (property_id === "async_queue" && value === "true") {
+ return "Batch";
+ }
+
return [];
})
.filter((p) => Boolean(p)),
diff --git a/src/components/models/ModelBadges.tsx b/src/components/models/ModelBadges.tsx
index 8babe92155375f..8b3c751dfebbc0 100644
--- a/src/components/models/ModelBadges.tsx
+++ b/src/components/models/ModelBadges.tsx
@@ -16,6 +16,13 @@ const ModelBadges = ({ model }: { model: WorkersAIModelsSchema }) => {
};
}
+ if (property_id === "async_queue" && value === "true") {
+ return {
+ variant: "note",
+ text: "Batch",
+ };
+ }
+
if (property_id === "planned_deprecation_date") {
const timestamp = Math.floor(new Date(value as string).getTime() / 1000);
diff --git a/src/components/models/ModelFeatures.tsx b/src/components/models/ModelFeatures.tsx
index 989c3930195797..a5ffe34acd6602 100644
--- a/src/components/models/ModelFeatures.tsx
+++ b/src/components/models/ModelFeatures.tsx
@@ -110,6 +110,12 @@ const ModelFeatures = ({ model }: { model: WorkersAIModelsSchema }) => {
Yes |
)}
+ {properties.async_queue && (
+
+ | Batch |
+ Yes |
+
+ )}
{properties.price && properties.price.length > 0 && (
| Unit Pricing |
diff --git a/src/content/workers-ai-models/bart-large-cnn.json b/src/content/workers-ai-models/bart-large-cnn.json
index e6918212ab67d8..96685f5a515cf9 100644
--- a/src/content/workers-ai-models/bart-large-cnn.json
+++ b/src/content/workers-ai-models/bart-large-cnn.json
@@ -14,6 +14,16 @@
{
"property_id": "beta",
"value": "true"
+ },
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per M input tokens",
+ "price": 0,
+ "currency": "USD"
+ }
+ ]
}
],
"schema": {
diff --git a/src/content/workers-ai-models/bge-base-en-v1.5.json b/src/content/workers-ai-models/bge-base-en-v1.5.json
index 0436c5e9269d49..0f11c5adee81a2 100644
--- a/src/content/workers-ai-models/bge-base-en-v1.5.json
+++ b/src/content/workers-ai-models/bge-base-en-v1.5.json
@@ -11,6 +11,10 @@
"created_at": "2023-09-25 19:21:11.898",
"tags": [],
"properties": [
+ {
+ "property_id": "async_queue",
+ "value": "true"
+ },
{
"property_id": "price",
"value": [
@@ -37,53 +41,135 @@
"schema": {
"input": {
"type": "object",
- "properties": {
- "text": {
- "oneOf": [
- {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
+ "oneOf": [
+ {
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
},
- {
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ },
+ {
+ "properties": {
+ "requests": {
"type": "array",
- "description": "Batch of text values to embed",
+ "description": "Batch of the embeddings requests to run using async-queue",
"items": {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
- },
- "maxItems": 100
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ }
}
+ },
+ "required": [
+ "requests"
]
}
- },
- "required": [
- "text"
]
},
"output": {
- "type": "object",
- "contentType": "application/json",
- "properties": {
- "shape": {
- "type": "array",
- "items": {
- "type": "number"
+ "oneOf": [
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "properties": {
+ "shape": {
+ "type": "array",
+ "items": {
+ "type": "number"
+ }
+ },
+ "data": {
+ "type": "array",
+ "description": "Embeddings of the requested text values",
+ "items": {
+ "type": "array",
+ "description": "Floating point embedding representation shaped by the embedding model",
+ "items": {
+ "type": "number"
+ }
+ }
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "description": "The pooling method used in the embedding process."
+ }
}
},
- "data": {
- "type": "array",
- "description": "Embeddings of the requested text values",
- "items": {
- "type": "array",
- "description": "Floating point embedding representation shaped by the embedding model",
- "items": {
- "type": "number"
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "title": "Async response",
+ "properties": {
+ "request_id": {
+ "type": "string",
+ "description": "The async request id that can be used to obtain the results."
}
}
}
- }
+ ]
}
}
}
\ No newline at end of file
diff --git a/src/content/workers-ai-models/bge-large-en-v1.5.json b/src/content/workers-ai-models/bge-large-en-v1.5.json
index a12d446087784a..fb514b587d41dc 100644
--- a/src/content/workers-ai-models/bge-large-en-v1.5.json
+++ b/src/content/workers-ai-models/bge-large-en-v1.5.json
@@ -11,6 +11,10 @@
"created_at": "2023-11-07 15:43:58.042",
"tags": [],
"properties": [
+ {
+ "property_id": "async_queue",
+ "value": "true"
+ },
{
"property_id": "price",
"value": [
@@ -23,7 +27,7 @@
},
{
"property_id": "info",
- "value": "https://huggingface.co/BAAI/bge-base-en-v1.5"
+ "value": "https://huggingface.co/BAAI/bge-large-en-v1.5"
},
{
"property_id": "max_input_tokens",
@@ -37,53 +41,135 @@
"schema": {
"input": {
"type": "object",
- "properties": {
- "text": {
- "oneOf": [
- {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
+ "oneOf": [
+ {
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
},
- {
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ },
+ {
+ "properties": {
+ "requests": {
"type": "array",
- "description": "Batch of text values to embed",
+ "description": "Batch of the embeddings requests to run using async-queue",
"items": {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
- },
- "maxItems": 100
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ }
}
+ },
+ "required": [
+ "requests"
]
}
- },
- "required": [
- "text"
]
},
"output": {
- "type": "object",
- "contentType": "application/json",
- "properties": {
- "shape": {
- "type": "array",
- "items": {
- "type": "number"
+ "oneOf": [
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "properties": {
+ "shape": {
+ "type": "array",
+ "items": {
+ "type": "number"
+ }
+ },
+ "data": {
+ "type": "array",
+ "description": "Embeddings of the requested text values",
+ "items": {
+ "type": "array",
+ "description": "Floating point embedding representation shaped by the embedding model",
+ "items": {
+ "type": "number"
+ }
+ }
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "description": "The pooling method used in the embedding process."
+ }
}
},
- "data": {
- "type": "array",
- "description": "Embeddings of the requested text values",
- "items": {
- "type": "array",
- "description": "Floating point embedding representation shaped by the embedding model",
- "items": {
- "type": "number"
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "title": "Async response",
+ "properties": {
+ "request_id": {
+ "type": "string",
+ "description": "The async request id that can be used to obtain the results."
}
}
}
- }
+ ]
}
}
}
\ No newline at end of file
diff --git a/src/content/workers-ai-models/bge-m3.json b/src/content/workers-ai-models/bge-m3.json
index 5020665ee9eec9..02420e31c02c72 100644
--- a/src/content/workers-ai-models/bge-m3.json
+++ b/src/content/workers-ai-models/bge-m3.json
@@ -11,6 +11,10 @@
"created_at": "2024-05-22 19:27:09.781",
"tags": [],
"properties": [
+ {
+ "property_id": "async_queue",
+ "value": "true"
+ },
{
"property_id": "price",
"value": [
@@ -89,6 +93,86 @@
"required": [
"text"
]
+ },
+ {
+ "properties": {
+ "requests": {
+ "type": "array",
+ "description": "Batch of the embeddings requests to run using async-queue",
+ "items": {
+ "type": "object",
+ "oneOf": [
+ {
+ "title": "BGE M3 Input Query and Contexts",
+ "properties": {
+ "query": {
+ "type": "string",
+ "minLength": 1,
+ "description": "A query you wish to perform against the provided contexts. If no query is provided the model with respond with embeddings for contexts"
+ },
+ "contexts": {
+ "type": "array",
+ "items": {
+ "type": "object",
+ "properties": {
+ "text": {
+ "type": "string",
+ "minLength": 1,
+ "description": "One of the provided context content"
+ }
+ }
+ },
+ "description": "List of provided contexts. Note that the index in this array is important, as the response will refer to it."
+ },
+ "truncate_inputs": {
+ "type": "boolean",
+ "default": false,
+ "description": "When provided with too long context should the model error out or truncate the context to fit?"
+ }
+ },
+ "required": [
+ "contexts"
+ ]
+ },
+ {
+ "title": "BGE M3 Input Embedding",
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
+ },
+ "truncate_inputs": {
+ "type": "boolean",
+ "default": false,
+ "description": "When provided with too long context should the model error out or truncate the context to fit?"
+ }
+ },
+ "required": [
+ "text"
+ ]
+ }
+ ]
+ }
+ }
+ },
+ "required": [
+ "requests"
+ ]
}
]
},
@@ -174,6 +258,17 @@
"description": "The pooling method used in the embedding process."
}
}
+ },
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "title": "Async response",
+ "properties": {
+ "request_id": {
+ "type": "string",
+ "description": "The async request id that can be used to obtain the results."
+ }
+ }
}
]
}
diff --git a/src/content/workers-ai-models/bge-reranker-base.json b/src/content/workers-ai-models/bge-reranker-base.json
index 2a6b997ae93a53..68f1cc2e25aa2b 100644
--- a/src/content/workers-ai-models/bge-reranker-base.json
+++ b/src/content/workers-ai-models/bge-reranker-base.json
@@ -10,7 +10,18 @@
},
"created_at": "2025-02-14 12:28:19.009",
"tags": [],
- "properties": [],
+ "properties": [
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per M input tokens",
+ "price": 0.0031,
+ "currency": "USD"
+ }
+ ]
+ }
+ ],
"schema": {
"input": {
"type": "object",
diff --git a/src/content/workers-ai-models/bge-small-en-v1.5.json b/src/content/workers-ai-models/bge-small-en-v1.5.json
index 90a04f9672920f..13203c5a65b5b0 100644
--- a/src/content/workers-ai-models/bge-small-en-v1.5.json
+++ b/src/content/workers-ai-models/bge-small-en-v1.5.json
@@ -11,6 +11,10 @@
"created_at": "2023-11-07 15:43:58.042",
"tags": [],
"properties": [
+ {
+ "property_id": "async_queue",
+ "value": "true"
+ },
{
"property_id": "price",
"value": [
@@ -37,53 +41,135 @@
"schema": {
"input": {
"type": "object",
- "properties": {
- "text": {
- "oneOf": [
- {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
+ "oneOf": [
+ {
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
},
- {
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ },
+ {
+ "properties": {
+ "requests": {
"type": "array",
- "description": "Batch of text values to embed",
+ "description": "Batch of the embeddings requests to run using async-queue",
"items": {
- "type": "string",
- "description": "The text to embed",
- "minLength": 1
- },
- "maxItems": 100
+ "properties": {
+ "text": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ {
+ "type": "array",
+ "description": "Batch of text values to embed",
+ "items": {
+ "type": "string",
+ "description": "The text to embed",
+ "minLength": 1
+ },
+ "maxItems": 100
+ }
+ ]
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "default": "mean",
+ "description": "The pooling method used in the embedding process. `cls` pooling will generate more accurate embeddings on larger inputs - however, embeddings created with cls pooling are not compatible with embeddings generated with mean pooling. The default pooling method is `mean` in order for this to not be a breaking change, but we highly suggest using the new `cls` pooling for better accuracy."
+ }
+ },
+ "required": [
+ "text"
+ ]
+ }
}
+ },
+ "required": [
+ "requests"
]
}
- },
- "required": [
- "text"
]
},
"output": {
- "type": "object",
- "contentType": "application/json",
- "properties": {
- "shape": {
- "type": "array",
- "items": {
- "type": "number"
+ "oneOf": [
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "properties": {
+ "shape": {
+ "type": "array",
+ "items": {
+ "type": "number"
+ }
+ },
+ "data": {
+ "type": "array",
+ "description": "Embeddings of the requested text values",
+ "items": {
+ "type": "array",
+ "description": "Floating point embedding representation shaped by the embedding model",
+ "items": {
+ "type": "number"
+ }
+ }
+ },
+ "pooling": {
+ "type": "string",
+ "enum": [
+ "mean",
+ "cls"
+ ],
+ "description": "The pooling method used in the embedding process."
+ }
}
},
- "data": {
- "type": "array",
- "description": "Embeddings of the requested text values",
- "items": {
- "type": "array",
- "description": "Floating point embedding representation shaped by the embedding model",
- "items": {
- "type": "number"
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "title": "Async response",
+ "properties": {
+ "request_id": {
+ "type": "string",
+ "description": "The async request id that can be used to obtain the results."
}
}
}
- }
+ ]
}
}
}
\ No newline at end of file
diff --git a/src/content/workers-ai-models/deepseek-r1-distill-qwen-32b.json b/src/content/workers-ai-models/deepseek-r1-distill-qwen-32b.json
index 957c5d62de8fda..18959db015dcd3 100644
--- a/src/content/workers-ai-models/deepseek-r1-distill-qwen-32b.json
+++ b/src/content/workers-ai-models/deepseek-r1-distill-qwen-32b.json
@@ -11,6 +11,10 @@
"created_at": "2025-01-22 19:48:55.776",
"tags": [],
"properties": [
+ {
+ "property_id": "context_window",
+ "value": "80000"
+ },
{
"property_id": "price",
"value": [
diff --git a/src/content/workers-ai-models/detr-resnet-50.json b/src/content/workers-ai-models/detr-resnet-50.json
index de6068019228c2..ae6dbfa8fa7742 100644
--- a/src/content/workers-ai-models/detr-resnet-50.json
+++ b/src/content/workers-ai-models/detr-resnet-50.json
@@ -14,6 +14,16 @@
{
"property_id": "beta",
"value": "true"
+ },
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per inference request",
+ "price": 0.0000075,
+ "currency": "USD"
+ }
+ ]
}
],
"schema": {
diff --git a/src/content/workers-ai-models/llama-3.2-11b-vision-instruct.json b/src/content/workers-ai-models/llama-3.2-11b-vision-instruct.json
index 19413dd77819ce..c767b1a5c86324 100644
--- a/src/content/workers-ai-models/llama-3.2-11b-vision-instruct.json
+++ b/src/content/workers-ai-models/llama-3.2-11b-vision-instruct.json
@@ -26,6 +26,10 @@
}
]
},
+ {
+ "property_id": "lora",
+ "value": "true"
+ },
{
"property_id": "terms",
"value": "https://github.com/meta-llama/llama-models/blob/main/models/llama3_2/LICENSE"
diff --git a/src/content/workers-ai-models/llama-3.3-70b-instruct-fp8-fast.json b/src/content/workers-ai-models/llama-3.3-70b-instruct-fp8-fast.json
index 4835f933d7d11f..fcd30b094e9b37 100644
--- a/src/content/workers-ai-models/llama-3.3-70b-instruct-fp8-fast.json
+++ b/src/content/workers-ai-models/llama-3.3-70b-instruct-fp8-fast.json
@@ -11,6 +11,10 @@
"created_at": "2024-12-06 17:09:18.338",
"tags": [],
"properties": [
+ {
+ "property_id": "context_window",
+ "value": "24000"
+ },
{
"property_id": "price",
"value": [
@@ -26,10 +30,6 @@
}
]
},
- {
- "property_id": "context_window",
- "value": "24000"
- },
{
"property_id": "function_calling",
"value": "true"
diff --git a/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json b/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json
index 1f9e754c18bd5f..a7db2042ed7a15 100644
--- a/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json
+++ b/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json
@@ -11,17 +11,21 @@
"created_at": "2025-04-05 20:25:56.137",
"tags": [],
"properties": [
+ {
+ "property_id": "context_window",
+ "value": "131000"
+ },
{
"property_id": "price",
"value": [
{
"unit": "per M input tokens",
- "price": 0.27,
+ "price": 0,
"currency": "USD"
},
{
"unit": "per M output tokens",
- "price": 0.85,
+ "price": 0,
"currency": "USD"
}
]
@@ -43,9 +47,9 @@
"minLength": 1,
"description": "The input text prompt for the model to generate a response."
},
- "lora": {
- "type": "string",
- "description": "Name of the LoRA (Low-Rank Adaptation) model to fine-tune the base model."
+ "guided_json": {
+ "type": "object",
+ "description": "JSON schema that should be fulfilled for the response."
},
"response_format": {
"title": "JSON Mode",
@@ -78,7 +82,7 @@
},
"temperature": {
"type": "number",
- "default": 0.6,
+ "default": 0.15,
"minimum": 0,
"maximum": 5,
"description": "Controls the randomness of the output; higher values produce more random results."
@@ -137,15 +141,67 @@
"type": "string",
"description": "The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool')."
},
- "content": {
+ "tool_call_id": {
"type": "string",
- "description": "The content of the message as a string."
+ "description": "The tool call id. Must be supplied for tool calls for Mistral-3. If you don't know what to put here you can fall back to 000000001",
+ "pattern": "[a-zA-Z0-9]{9}"
+ },
+ "content": {
+ "oneOf": [
+ {
+ "type": "string",
+ "description": "The content of the message as a string."
+ },
+ {
+ "type": "array",
+ "items": {
+ "type": "object",
+ "properties": {
+ "type": {
+ "type": "string",
+ "description": "Type of the content provided"
+ },
+ "text": {
+ "type": "string"
+ },
+ "image_url": {
+ "type": "object",
+ "properties": {
+ "url": {
+ "type": "string",
+ "pattern": "^data:*",
+ "description": "image uri with data (e.g. ...). HTTP URL will not be accepted"
+ }
+ }
+ }
+ }
+ }
+ },
+ {
+ "type": "object",
+ "properties": {
+ "type": {
+ "type": "string",
+ "description": "Type of the content provided"
+ },
+ "text": {
+ "type": "string"
+ },
+ "image_url": {
+ "type": "object",
+ "properties": {
+ "url": {
+ "type": "string",
+ "pattern": "^data:*",
+ "description": "image uri with data (e.g. ...). HTTP URL will not be accepted"
+ }
+ }
+ }
+ }
+ }
+ ]
}
- },
- "required": [
- "role",
- "content"
- ]
+ }
}
},
"functions": {
@@ -321,6 +377,10 @@
"json_schema": {}
}
},
+ "guided_json": {
+ "type": "object",
+ "description": "JSON schema that should be fufilled for the response."
+ },
"raw": {
"type": "boolean",
"default": false,
@@ -338,7 +398,7 @@
},
"temperature": {
"type": "number",
- "default": 0.6,
+ "default": 0.15,
"minimum": 0,
"maximum": 5,
"description": "Controls the randomness of the output; higher values produce more random results."
@@ -390,6 +450,7 @@
"oneOf": [
{
"type": "object",
+ "contentType": "application/json",
"properties": {
"response": {
"type": "string",
@@ -440,6 +501,7 @@
},
{
"type": "string",
+ "contentType": "text/event-stream",
"format": "binary"
}
]
diff --git a/src/content/workers-ai-models/llama-guard-3-8b.json b/src/content/workers-ai-models/llama-guard-3-8b.json
index 77b1872ea2d9e0..5f5d39495289ca 100644
--- a/src/content/workers-ai-models/llama-guard-3-8b.json
+++ b/src/content/workers-ai-models/llama-guard-3-8b.json
@@ -25,6 +25,10 @@
"currency": "USD"
}
]
+ },
+ {
+ "property_id": "lora",
+ "value": "true"
}
],
"schema": {
diff --git a/src/content/workers-ai-models/m2m100-1.2b.json b/src/content/workers-ai-models/m2m100-1.2b.json
index e3bcfdace56ea9..022b7dcca7897a 100644
--- a/src/content/workers-ai-models/m2m100-1.2b.json
+++ b/src/content/workers-ai-models/m2m100-1.2b.json
@@ -11,6 +11,10 @@
"created_at": "2023-09-25 19:21:11.898",
"tags": [],
"properties": [
+ {
+ "property_id": "async_queue",
+ "value": "true"
+ },
{
"property_id": "price",
"value": [
@@ -42,36 +46,89 @@
"schema": {
"input": {
"type": "object",
- "properties": {
- "text": {
- "type": "string",
- "minLength": 1,
- "description": "The text to be translated"
- },
- "source_lang": {
- "type": "string",
- "default": "en",
- "description": "The language code of the source text (e.g., 'en' for English). Defaults to 'en' if not specified"
+ "oneOf": [
+ {
+ "properties": {
+ "text": {
+ "type": "string",
+ "minLength": 1,
+ "description": "The text to be translated"
+ },
+ "source_lang": {
+ "type": "string",
+ "default": "en",
+ "description": "The language code of the source text (e.g., 'en' for English). Defaults to 'en' if not specified"
+ },
+ "target_lang": {
+ "type": "string",
+ "description": "The language code to translate the text into (e.g., 'es' for Spanish)"
+ }
+ },
+ "required": [
+ "text",
+ "target_lang"
+ ]
},
- "target_lang": {
- "type": "string",
- "description": "The language code to translate the text into (e.g., 'es' for Spanish)"
+ {
+ "properties": {
+ "requests": {
+ "type": "array",
+ "description": "Batch of the embeddings requests to run using async-queue",
+ "items": {
+ "type": "object",
+ "properties": {
+ "text": {
+ "type": "string",
+ "minLength": 1,
+ "description": "The text to be translated"
+ },
+ "source_lang": {
+ "type": "string",
+ "default": "en",
+ "description": "The language code of the source text (e.g., 'en' for English). Defaults to 'en' if not specified"
+ },
+ "target_lang": {
+ "type": "string",
+ "description": "The language code to translate the text into (e.g., 'es' for Spanish)"
+ }
+ },
+ "required": [
+ "text",
+ "target_lang"
+ ]
+ }
+ }
+ },
+ "required": [
+ "requests"
+ ]
}
- },
- "required": [
- "text",
- "target_lang"
]
},
"output": {
"type": "object",
"contentType": "application/json",
- "properties": {
- "translated_text": {
- "type": "string",
- "description": "The translated text in the target language"
+ "oneOf": [
+ {
+ "properties": {
+ "translated_text": {
+ "type": "string",
+ "description": "The translated text in the target language"
+ }
+ }
+ },
+ {
+ "type": "object",
+ "contentType": "application/json",
+ "title": "Async response",
+ "properties": {
+ "request_id": {
+ "type": "string",
+ "description": "The async request id that can be used to obtain the results."
+ }
+ }
}
- }
+ ]
}
}
}
\ No newline at end of file
diff --git a/src/content/workers-ai-models/melotts.json b/src/content/workers-ai-models/melotts.json
index 63e9a49a80b952..55d9cc3a9bd144 100644
--- a/src/content/workers-ai-models/melotts.json
+++ b/src/content/workers-ai-models/melotts.json
@@ -10,7 +10,18 @@
},
"created_at": "2024-07-19 15:51:04.819",
"tags": [],
- "properties": [],
+ "properties": [
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per audio minute",
+ "price": 0.0002,
+ "currency": "USD"
+ }
+ ]
+ }
+ ],
"schema": {
"input": {
"type": "object",
diff --git a/src/content/workers-ai-models/stable-diffusion-v1-5-img2img.json b/src/content/workers-ai-models/stable-diffusion-v1-5-img2img.json
index 14e21b3b6101d2..493f47248141cf 100644
--- a/src/content/workers-ai-models/stable-diffusion-v1-5-img2img.json
+++ b/src/content/workers-ai-models/stable-diffusion-v1-5-img2img.json
@@ -15,6 +15,16 @@
"property_id": "beta",
"value": "true"
},
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per step",
+ "price": 0,
+ "currency": "USD"
+ }
+ ]
+ },
{
"property_id": "info",
"value": "https://huggingface.co/runwayml/stable-diffusion-v1-5"
diff --git a/src/content/workers-ai-models/stable-diffusion-v1-5-inpainting.json b/src/content/workers-ai-models/stable-diffusion-v1-5-inpainting.json
index ab7347ee61cf92..22188f1a18d884 100644
--- a/src/content/workers-ai-models/stable-diffusion-v1-5-inpainting.json
+++ b/src/content/workers-ai-models/stable-diffusion-v1-5-inpainting.json
@@ -15,6 +15,16 @@
"property_id": "beta",
"value": "true"
},
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per step",
+ "price": 0,
+ "currency": "USD"
+ }
+ ]
+ },
{
"property_id": "info",
"value": "https://huggingface.co/runwayml/stable-diffusion-inpainting"
diff --git a/src/content/workers-ai-models/stable-diffusion-xl-base-1.0.json b/src/content/workers-ai-models/stable-diffusion-xl-base-1.0.json
index 029b714cc1e44c..bfeb09a16a161e 100644
--- a/src/content/workers-ai-models/stable-diffusion-xl-base-1.0.json
+++ b/src/content/workers-ai-models/stable-diffusion-xl-base-1.0.json
@@ -15,6 +15,16 @@
"property_id": "beta",
"value": "true"
},
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per step",
+ "price": 0,
+ "currency": "USD"
+ }
+ ]
+ },
{
"property_id": "info",
"value": "https://stability.ai/stable-diffusion"
diff --git a/src/content/workers-ai-models/stable-diffusion-xl-lightning.json b/src/content/workers-ai-models/stable-diffusion-xl-lightning.json
index 0f0ac46b754b7e..19e57d6388975d 100644
--- a/src/content/workers-ai-models/stable-diffusion-xl-lightning.json
+++ b/src/content/workers-ai-models/stable-diffusion-xl-lightning.json
@@ -15,6 +15,16 @@
"property_id": "beta",
"value": "true"
},
+ {
+ "property_id": "price",
+ "value": [
+ {
+ "unit": "per step",
+ "price": 0,
+ "currency": "USD"
+ }
+ ]
+ },
{
"property_id": "info",
"value": "https://huggingface.co/ByteDance/SDXL-Lightning"