[Workers AI] Models update

kodster28 · kodster28 · commit ffb1bb4f60ed · 2025-09-04T16:53:58.000-05:00
diff --git a/src/content/workers-ai-models/aura-1.json b/src/content/workers-ai-models/aura-1.json
@@ -15,23 +15,23 @@
             "property_id": "async_queue",
             "value": "true"
         },
-        {
-            "property_id": "partner",
-            "value": "true"
-        },
-        {
-            "property_id": "realtime",
-            "value": "true"
-        },
         {
             "property_id": "price",
             "value": [
                 {
-                    "unit": "per 1k characters",
-                    "price": 0.0150,
+                    "unit": "per audio minute",
+                    "price": 0,
                     "currency": "USD"
                 }
             ]
+        },
+        {
+            "property_id": "partner",
+            "value": "true"
+        },
+        {
+            "property_id": "realtime",
+            "value": "true"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/deepseek-coder-6.7b-base-awq.json b/src/content/workers-ai-models/deepseek-coder-6.7b-base-awq.json
@@ -19,6 +19,10 @@
             "property_id": "context_window",
             "value": "4096"
         },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
+        },
         {
             "property_id": "terms",
             "value": "https://huggingface.co/TheBloke/deepseek-coder-6.7B-base-AWQ"
diff --git a/src/content/workers-ai-models/deepseek-coder-6.7b-instruct-awq.json b/src/content/workers-ai-models/deepseek-coder-6.7b-instruct-awq.json
@@ -19,6 +19,10 @@
             "property_id": "context_window",
             "value": "4096"
         },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
+        },
         {
             "property_id": "terms",
             "value": "https://huggingface.co/TheBloke/deepseek-coder-6.7B-instruct-AWQ"
diff --git a/src/content/workers-ai-models/deepseek-math-7b-instruct.json b/src/content/workers-ai-models/deepseek-math-7b-instruct.json
@@ -23,6 +23,10 @@
             "property_id": "info",
             "value": "https://huggingface.co/deepseek-ai/deepseek-math-7b-instruct"
         },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
+        },
         {
             "property_id": "terms",
             "value": "https://github.com/deepseek-ai/DeepSeek-Math/blob/main/LICENSE-MODEL"
diff --git a/src/content/workers-ai-models/discolm-german-7b-v1-awq.json b/src/content/workers-ai-models/discolm-german-7b-v1-awq.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/TheBloke/DiscoLM_German_7b_v1-AWQ"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/falcon-7b-instruct.json b/src/content/workers-ai-models/falcon-7b-instruct.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/tiiuae/falcon-7b-instruct"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/gpt-oss-20b.json b/src/content/workers-ai-models/gpt-oss-20b.json
@@ -11,6 +11,10 @@
     "created_at": "2025-08-05 10:49:53.265",
     "tags": [],
     "properties": [
+        {
+            "property_id": "async_queue",
+            "value": "true"
+        },
         {
             "property_id": "context_window",
             "value": "128000"
@@ -33,48 +37,108 @@
     ],
     "schema": {
         "input": {
-            "type": "object",
-            "title": "GPT_OSS_Responses",
-            "properties": {
-                "input": {
-                    "anyOf": [
-                        {
-                            "type": "string"
+            "oneOf": [
+                {
+                    "type": "object",
+                    "title": "GPT_OSS_Responses",
+                    "properties": {
+                        "input": {
+                            "anyOf": [
+                                {
+                                    "type": "string"
+                                },
+                                {
+                                    "items": {},
+                                    "type": "array"
+                                }
+                            ],
+                            "description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
+                            "title": "Input"
                         },
-                        {
-                            "items": {},
-                            "type": "array"
+                        "reasoning": {
+                            "type": "object",
+                            "properties": {
+                                "effort": {
+                                    "type": "string",
+                                    "description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
+                                    "enum": [
+                                        "low",
+                                        "medium",
+                                        "high"
+                                    ]
+                                },
+                                "summary": {
+                                    "type": "string",
+                                    "description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
+                                    "enum": [
+                                        "auto",
+                                        "concise",
+                                        "detailed"
+                                    ]
+                                }
+                            }
                         }
-                    ],
-                    "description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
-                    "title": "Input"
+                    },
+                    "required": [
+                        "input"
+                    ]
                 },
-                "reasoning": {
+                {
                     "type": "object",
+                    "title": "GPT_OSS_Responses_Async",
                     "properties": {
-                        "effort": {
-                            "type": "string",
-                            "description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
-                            "enum": [
-                                "low",
-                                "medium",
-                                "high"
-                            ]
-                        },
-                        "summary": {
-                            "type": "string",
-                            "description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
-                            "enum": [
-                                "auto",
-                                "concise",
-                                "detailed"
-                            ]
+                        "requests": {
+                            "type": "array",
+                            "items": {
+                                "type": "object",
+                                "properties": {
+                                    "input": {
+                                        "anyOf": [
+                                            {
+                                                "type": "string"
+                                            },
+                                            {
+                                                "items": {},
+                                                "type": "array"
+                                            }
+                                        ],
+                                        "description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
+                                        "title": "Input"
+                                    },
+                                    "reasoning": {
+                                        "type": "object",
+                                        "properties": {
+                                            "effort": {
+                                                "type": "string",
+                                                "description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
+                                                "enum": [
+                                                    "low",
+                                                    "medium",
+                                                    "high"
+                                                ]
+                                            },
+                                            "summary": {
+                                                "type": "string",
+                                                "description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
+                                                "enum": [
+                                                    "auto",
+                                                    "concise",
+                                                    "detailed"
+                                                ]
+                                            }
+                                        }
+                                    }
+                                },
+                                "required": [
+                                    "input"
+                                ]
+                            }
                         }
-                    }
+                    },
+                    "required": [
+                        "requests"
+                    ]
                 }
-            },
-            "required": [
-                "input"
             ]
         },
         "output": {
diff --git a/src/content/workers-ai-models/llama-2-13b-chat-awq.json b/src/content/workers-ai-models/llama-2-13b-chat-awq.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/TheBloke/Llama-2-13B-chat-AWQ"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/llamaguard-7b-awq.json b/src/content/workers-ai-models/llamaguard-7b-awq.json
@@ -18,6 +18,10 @@
         {
             "property_id": "context_window",
             "value": "4096"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/mistral-7b-instruct-v0.1-awq.json b/src/content/workers-ai-models/mistral-7b-instruct-v0.1-awq.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-AWQ"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json b/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json
@@ -18,6 +18,10 @@
         {
             "property_id": "context_window",
             "value": "4096"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/openchat-3.5-0106.json b/src/content/workers-ai-models/openchat-3.5-0106.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/openchat/openchat-3.5-0106"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/openhermes-2.5-mistral-7b-awq.json b/src/content/workers-ai-models/openhermes-2.5-mistral-7b-awq.json
@@ -18,6 +18,10 @@
         {
             "property_id": "context_window",
             "value": "4096"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/qwen1.5-0.5b-chat.json b/src/content/workers-ai-models/qwen1.5-0.5b-chat.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/qwen/qwen1.5-0.5b-chat"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/qwen1.5-1.8b-chat.json b/src/content/workers-ai-models/qwen1.5-1.8b-chat.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/qwen/qwen1.5-1.8b-chat"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/qwen1.5-14b-chat-awq.json b/src/content/workers-ai-models/qwen1.5-14b-chat-awq.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/qwen/qwen1.5-14b-chat-awq"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/qwen1.5-7b-chat-awq.json b/src/content/workers-ai-models/qwen1.5-7b-chat-awq.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/qwen/qwen1.5-7b-chat-awq"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/smart-turn-v2.json b/src/content/workers-ai-models/smart-turn-v2.json
@@ -5,8 +5,8 @@
     "description": "An open source, community-driven, native audio turn detection model in 2nd version",
     "task": {
         "id": "ccb1ca5a-043d-41a7-8a3b-61017b2796fd",
-        "name": "Voice Activity Detection",
-        "description": "Detecting the presence or absence of human speech, used in speech processing."
+        "name": "Dumb Pipe",
+        "description": "Internal - Dumb Pipe models don't use tensors"
     },
     "created_at": "2025-08-04 10:08:04.219",
     "tags": [],
diff --git a/src/content/workers-ai-models/starling-lm-7b-beta.json b/src/content/workers-ai-models/starling-lm-7b-beta.json
@@ -34,6 +34,10 @@
         {
             "property_id": "max_total_tokens",
             "value": "4096"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/tinyllama-1.1b-chat-v1.0.json b/src/content/workers-ai-models/tinyllama-1.1b-chat-v1.0.json
@@ -22,6 +22,10 @@
         {
             "property_id": "info",
             "value": "https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json b/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json
@@ -18,6 +18,10 @@
         {
             "property_id": "context_window",
             "value": "15000"
+        },
+        {
+            "property_id": "planned_deprecation_date",
+            "value": "2025-10-01"
         }
     ],
     "schema": {
diff --git a/src/content/workers-ai-models/zephyr-7b-beta-awq.json b/src/content/workers-ai-models/zephyr-7b-beta-awq.json

Original file line number	Diff line number	Diff line change
`@@ -22,6 +22,10 @@`
`22`	`22`	`{`
`23`	`23`	`"property_id": "info",`
`24`	`24`	`"value": "https://huggingface.co/TheBloke/DiscoLM_German_7b_v1-AWQ"`
	`25`	`+ },`
	`26`	`+ {`
	`27`	`+ "property_id": "planned_deprecation_date",`
	`28`	`+ "value": "2025-10-01"`
`25`	`29`	`}`
`26`	`30`	`],`
`27`	`31`	`"schema": {`
Original file line number	Diff line number	Diff line change
`@@ -18,6 +18,10 @@`
`18`	`18`	`{`
`19`	`19`	`"property_id": "context_window",`
`20`	`20`	`"value": "4096"`
	`21`	`+ },`
	`22`	`+ {`
	`23`	`+ "property_id": "planned_deprecation_date",`
	`24`	`+ "value": "2025-10-01"`
`21`	`25`	`}`
`22`	`26`	`],`
`23`	`27`	`"schema": {`