Skip to content

Commit ffb1bb4

Browse files
committed
[Workers AI] Models update
1 parent 3152ab7 commit ffb1bb4

22 files changed

+187
-47
lines changed

src/content/workers-ai-models/aura-1.json

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -15,23 +15,23 @@
1515
"property_id": "async_queue",
1616
"value": "true"
1717
},
18-
{
19-
"property_id": "partner",
20-
"value": "true"
21-
},
22-
{
23-
"property_id": "realtime",
24-
"value": "true"
25-
},
2618
{
2719
"property_id": "price",
2820
"value": [
2921
{
30-
"unit": "per 1k characters",
31-
"price": 0.0150,
22+
"unit": "per audio minute",
23+
"price": 0,
3224
"currency": "USD"
3325
}
3426
]
27+
},
28+
{
29+
"property_id": "partner",
30+
"value": "true"
31+
},
32+
{
33+
"property_id": "realtime",
34+
"value": "true"
3535
}
3636
],
3737
"schema": {

src/content/workers-ai-models/deepseek-coder-6.7b-base-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,10 @@
1919
"property_id": "context_window",
2020
"value": "4096"
2121
},
22+
{
23+
"property_id": "planned_deprecation_date",
24+
"value": "2025-10-01"
25+
},
2226
{
2327
"property_id": "terms",
2428
"value": "https://huggingface.co/TheBloke/deepseek-coder-6.7B-base-AWQ"

src/content/workers-ai-models/deepseek-coder-6.7b-instruct-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,10 @@
1919
"property_id": "context_window",
2020
"value": "4096"
2121
},
22+
{
23+
"property_id": "planned_deprecation_date",
24+
"value": "2025-10-01"
25+
},
2226
{
2327
"property_id": "terms",
2428
"value": "https://huggingface.co/TheBloke/deepseek-coder-6.7B-instruct-AWQ"

src/content/workers-ai-models/deepseek-math-7b-instruct.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,10 @@
2323
"property_id": "info",
2424
"value": "https://huggingface.co/deepseek-ai/deepseek-math-7b-instruct"
2525
},
26+
{
27+
"property_id": "planned_deprecation_date",
28+
"value": "2025-10-01"
29+
},
2630
{
2731
"property_id": "terms",
2832
"value": "https://github.com/deepseek-ai/DeepSeek-Math/blob/main/LICENSE-MODEL"

src/content/workers-ai-models/discolm-german-7b-v1-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,10 @@
2222
{
2323
"property_id": "info",
2424
"value": "https://huggingface.co/TheBloke/DiscoLM_German_7b_v1-AWQ"
25+
},
26+
{
27+
"property_id": "planned_deprecation_date",
28+
"value": "2025-10-01"
2529
}
2630
],
2731
"schema": {

src/content/workers-ai-models/falcon-7b-instruct.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,10 @@
2222
{
2323
"property_id": "info",
2424
"value": "https://huggingface.co/tiiuae/falcon-7b-instruct"
25+
},
26+
{
27+
"property_id": "planned_deprecation_date",
28+
"value": "2025-10-01"
2529
}
2630
],
2731
"schema": {

src/content/workers-ai-models/gpt-oss-20b.json

Lines changed: 99 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,10 @@
1111
"created_at": "2025-08-05 10:49:53.265",
1212
"tags": [],
1313
"properties": [
14+
{
15+
"property_id": "async_queue",
16+
"value": "true"
17+
},
1418
{
1519
"property_id": "context_window",
1620
"value": "128000"
@@ -33,48 +37,108 @@
3337
],
3438
"schema": {
3539
"input": {
36-
"type": "object",
37-
"title": "GPT_OSS_Responses",
38-
"properties": {
39-
"input": {
40-
"anyOf": [
41-
{
42-
"type": "string"
40+
"oneOf": [
41+
{
42+
"type": "object",
43+
"title": "GPT_OSS_Responses",
44+
"properties": {
45+
"input": {
46+
"anyOf": [
47+
{
48+
"type": "string"
49+
},
50+
{
51+
"items": {},
52+
"type": "array"
53+
}
54+
],
55+
"description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
56+
"title": "Input"
4357
},
44-
{
45-
"items": {},
46-
"type": "array"
58+
"reasoning": {
59+
"type": "object",
60+
"properties": {
61+
"effort": {
62+
"type": "string",
63+
"description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
64+
"enum": [
65+
"low",
66+
"medium",
67+
"high"
68+
]
69+
},
70+
"summary": {
71+
"type": "string",
72+
"description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
73+
"enum": [
74+
"auto",
75+
"concise",
76+
"detailed"
77+
]
78+
}
79+
}
4780
}
48-
],
49-
"description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
50-
"title": "Input"
81+
},
82+
"required": [
83+
"input"
84+
]
5185
},
52-
"reasoning": {
86+
{
5387
"type": "object",
88+
"title": "GPT_OSS_Responses_Async",
5489
"properties": {
55-
"effort": {
56-
"type": "string",
57-
"description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
58-
"enum": [
59-
"low",
60-
"medium",
61-
"high"
62-
]
63-
},
64-
"summary": {
65-
"type": "string",
66-
"description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
67-
"enum": [
68-
"auto",
69-
"concise",
70-
"detailed"
71-
]
90+
"requests": {
91+
"type": "array",
92+
"items": {
93+
"type": "object",
94+
"properties": {
95+
"input": {
96+
"anyOf": [
97+
{
98+
"type": "string"
99+
},
100+
{
101+
"items": {},
102+
"type": "array"
103+
}
104+
],
105+
"description": "Responses API Input messages. Refer to OpenAI Responses API docs to learn more about supported content types",
106+
"title": "Input"
107+
},
108+
"reasoning": {
109+
"type": "object",
110+
"properties": {
111+
"effort": {
112+
"type": "string",
113+
"description": "Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.",
114+
"enum": [
115+
"low",
116+
"medium",
117+
"high"
118+
]
119+
},
120+
"summary": {
121+
"type": "string",
122+
"description": "A summary of the reasoning performed by the model. This can be useful for debugging and understanding the model's reasoning process. One of auto, concise, or detailed.",
123+
"enum": [
124+
"auto",
125+
"concise",
126+
"detailed"
127+
]
128+
}
129+
}
130+
}
131+
},
132+
"required": [
133+
"input"
134+
]
135+
}
72136
}
73-
}
137+
},
138+
"required": [
139+
"requests"
140+
]
74141
}
75-
},
76-
"required": [
77-
"input"
78142
]
79143
},
80144
"output": {

src/content/workers-ai-models/llama-2-13b-chat-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,10 @@
2222
{
2323
"property_id": "info",
2424
"value": "https://huggingface.co/TheBloke/Llama-2-13B-chat-AWQ"
25+
},
26+
{
27+
"property_id": "planned_deprecation_date",
28+
"value": "2025-10-01"
2529
}
2630
],
2731
"schema": {

src/content/workers-ai-models/llamaguard-7b-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,10 @@
1818
{
1919
"property_id": "context_window",
2020
"value": "4096"
21+
},
22+
{
23+
"property_id": "planned_deprecation_date",
24+
"value": "2025-10-01"
2125
}
2226
],
2327
"schema": {

src/content/workers-ai-models/mistral-7b-instruct-v0.1-awq.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,10 @@
2222
{
2323
"property_id": "info",
2424
"value": "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-AWQ"
25+
},
26+
{
27+
"property_id": "planned_deprecation_date",
28+
"value": "2025-10-01"
2529
}
2630
],
2731
"schema": {

0 commit comments

Comments
 (0)