Skip to content

Commit 289f7f2

Browse files
committed
[Workers AI] Model updates
1 parent f76e6a9 commit 289f7f2

File tree

9 files changed

+1365
-655
lines changed

9 files changed

+1365
-655
lines changed

src/content/workers-ai-models/aura-1.json

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -15,23 +15,23 @@
1515
"property_id": "async_queue",
1616
"value": "true"
1717
},
18-
{
19-
"property_id": "partner",
20-
"value": "true"
21-
},
22-
{
23-
"property_id": "realtime",
24-
"value": "true"
25-
},
2618
{
2719
"property_id": "price",
2820
"value": [
2921
{
30-
"unit": "per 1k characters",
31-
"price": 0.0150,
22+
"unit": "per audio minute",
23+
"price": 0,
3224
"currency": "USD"
3325
}
3426
]
27+
},
28+
{
29+
"property_id": "partner",
30+
"value": "true"
31+
},
32+
{
33+
"property_id": "realtime",
34+
"value": "true"
3535
}
3636
],
3737
"schema": {

src/content/workers-ai-models/bge-m3.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,10 @@
1515
"property_id": "async_queue",
1616
"value": "true"
1717
},
18+
{
19+
"property_id": "context_window",
20+
"value": "60000"
21+
},
1822
{
1923
"property_id": "price",
2024
"value": [
Lines changed: 32 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
{
2-
"id": "d2f07a41-c152-4061-8083-ec655cbf91a1",
2+
"id": "15631501-2742-4346-a469-22fe202188a2",
33
"source": 1,
44
"name": "@cf/google/embeddinggemma-300m",
55
"description": "EmbeddingGemma is a 300M parameter, state-of-the-art for its size, open embedding model from Google, built from Gemma 3 (with T5Gemma initialization) and the same research and technology used to create Gemini models. EmbeddingGemma produces vector representations of text, making it well-suited for search and retrieval tasks, including classification, clustering, and semantic similarity search. This model was trained with data in 100+ spoken languages.",
@@ -8,51 +8,59 @@
88
"name": "Text Embeddings",
99
"description": "Feature extraction models transform raw data into numerical features that can be processed while preserving the information in the original dataset. These models are ideal as part of building vector search applications or Retrieval Augmented Generation workflows with Large Language Models (LLM)."
1010
},
11-
"created_at": "2025-09-03 20:48:38.784",
11+
"created_at": "2025-09-04 16:38:44.980",
1212
"tags": [],
1313
"properties": [],
1414
"schema": {
1515
"input": {
1616
"type": "object",
1717
"properties": {
1818
"text": {
19-
"oneOf": [{
20-
"type": "string"
21-
}, {
22-
"type": "array",
23-
"items": {
24-
"type": "string"
19+
"oneOf": [
20+
{
21+
"type": "string",
22+
"description": "The text to embed",
23+
"minLength": 1
24+
},
25+
{
26+
"type": "array",
27+
"description": "Batch of text values to embed",
28+
"items": {
29+
"type": "string",
30+
"description": "The text to embed",
31+
"minLength": 1
32+
},
33+
"maxItems": 100
2534
}
26-
}],
27-
"description": "Input text to embed. Can be a single string or a list of strings."
35+
]
2836
}
2937
},
30-
"required": ["text"]
38+
"required": [
39+
"text"
40+
]
3141
},
3242
"output": {
3343
"type": "object",
44+
"contentType": "application/json",
3445
"properties": {
46+
"shape": {
47+
"type": "array",
48+
"items": {
49+
"type": "number"
50+
}
51+
},
3552
"data": {
3653
"type": "array",
54+
"description": "Embeddings of the requested text values",
3755
"items": {
3856
"type": "array",
57+
"description": "Floating point embedding representation shaped by the embedding model",
3958
"items": {
4059
"type": "number"
4160
}
42-
},
43-
"description": "Embedding vectors, where each vector is a list of floats."
44-
},
45-
"shape": {
46-
"type": "array",
47-
"items": {
48-
"type": "integer"
49-
},
50-
"minItems": 2,
51-
"maxItems": 2,
52-
"description": "Shape of the embedding data as [number_of_embeddings, embedding_dimension]."
61+
}
5362
}
54-
},
55-
"required": ["data", "shape"]
63+
}
5664
}
5765
}
5866
}

src/content/workers-ai-models/flux.json

Lines changed: 116 additions & 116 deletions
Original file line numberDiff line numberDiff line change
@@ -21,126 +21,126 @@
2121
}
2222
],
2323
"schema": {
24-
"input": {
25-
"type": "object",
26-
"properties": {
27-
"encoding": {
28-
"type": "string",
29-
"description": "Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM.",
30-
"enum": [
31-
"linear16"
32-
]
33-
},
34-
"sample_rate": {
35-
"type": "string",
36-
"description": "Sample rate of the audio stream in Hz.",
37-
"pattern": "^[0-9]+$"
38-
},
39-
"eager_eot_threshold": {
40-
"type": "string",
41-
"description": "End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid Values 0.3 - 0.9."
42-
},
43-
"eot_threshold": {
44-
"type": "string",
45-
"description": "End-of-turn confidence required to finish a turn. Valid Values 0.5 - 0.9.",
46-
"default": "0.7"
47-
},
48-
"eot_timeout_ms": {
49-
"type": "string",
50-
"description": "A turn will be finished when this much time has passed after speech, regardless of EOT confidence.",
51-
"default": "5000",
52-
"pattern": "^[0-9]+$"
53-
},
54-
"keyterm": {
55-
"type": "string",
56-
"description": "Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms."
57-
},
58-
"mip_opt_out": {
59-
"type": "string",
60-
"description": "Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip",
61-
"enum": [
62-
"true",
63-
"false"
64-
],
65-
"default": "false"
66-
},
67-
"tag": {
68-
"type": "string",
69-
"description": "Label your requests for the purpose of identification during usage reporting"
70-
},
71-
"required": [
72-
"sample_rate",
73-
"encoding"
74-
]
75-
}
76-
},
77-
"output": {
78-
"type": "object",
79-
"description": "Output will be returned as websocket messages.",
80-
"properties": {
81-
"request_id": {
82-
"type": "string",
83-
"description": "The unique identifier of the request (uuid)"
84-
},
85-
"sequence_id": {
86-
"type": "integer",
87-
"description": "Starts at 0 and increments for each message the server sends to the client.",
88-
"minimum": 0
89-
},
90-
"event": {
91-
"type": "string",
92-
"description": "The type of event being reported.",
93-
"enum": [
94-
"Update",
95-
"StartOfTurn",
96-
"EagerEndOfTurn",
97-
"TurnResumed",
98-
"EndOfTurn"
24+
"input": {
25+
"type": "object",
26+
"properties": {
27+
"encoding": {
28+
"type": "string",
29+
"description": "Encoding of the audio stream. Currently only supports raw signed little-endian 16-bit PCM.",
30+
"enum": [
31+
"linear16"
32+
]
33+
},
34+
"sample_rate": {
35+
"type": "string",
36+
"description": "Sample rate of the audio stream in Hz.",
37+
"pattern": "^[0-9]+$"
38+
},
39+
"eager_eot_threshold": {
40+
"type": "string",
41+
"description": "End-of-turn confidence required to fire an eager end-of-turn event. When set, enables EagerEndOfTurn and TurnResumed events. Valid Values 0.3 - 0.9."
42+
},
43+
"eot_threshold": {
44+
"type": "string",
45+
"description": "End-of-turn confidence required to finish a turn. Valid Values 0.5 - 0.9.",
46+
"default": "0.7"
47+
},
48+
"eot_timeout_ms": {
49+
"type": "string",
50+
"description": "A turn will be finished when this much time has passed after speech, regardless of EOT confidence.",
51+
"default": "5000",
52+
"pattern": "^[0-9]+$"
53+
},
54+
"keyterm": {
55+
"type": "string",
56+
"description": "Keyterm prompting can improve recognition of specialized terminology. Pass multiple keyterm query parameters to boost multiple keyterms."
57+
},
58+
"mip_opt_out": {
59+
"type": "string",
60+
"description": "Opts out requests from the Deepgram Model Improvement Program. Refer to Deepgram Docs for pricing impacts before setting this to true. https://dpgr.am/deepgram-mip",
61+
"enum": [
62+
"true",
63+
"false"
64+
],
65+
"default": "false"
66+
},
67+
"tag": {
68+
"type": "string",
69+
"description": "Label your requests for the purpose of identification during usage reporting"
70+
}
71+
},
72+
"required": [
73+
"sample_rate",
74+
"encoding"
9975
]
100-
},
101-
"turn_index": {
102-
"type": "integer",
103-
"description": "The index of the current turn",
104-
"minimum": 0
105-
},
106-
"audio_window_start": {
107-
"type": "number",
108-
"description": "Start time in seconds of the audio range that was transcribed"
109-
},
110-
"audio_window_end": {
111-
"type": "number",
112-
"description": "End time in seconds of the audio range that was transcribed"
113-
},
114-
"transcript": {
115-
"type": "string",
116-
"description": "Text that was said over the course of the current turn"
117-
},
118-
"words": {
119-
"type": "array",
120-
"description": "The words in the transcript",
121-
"items": {
122-
"type": "object",
123-
"required": [
124-
"word",
125-
"confidence"
126-
],
127-
"properties": {
128-
"word": {
129-
"type": "string",
130-
"description": "The individual punctuated, properly-cased word from the transcript"
76+
},
77+
"output": {
78+
"type": "object",
79+
"description": "Output will be returned as websocket messages.",
80+
"properties": {
81+
"request_id": {
82+
"type": "string",
83+
"description": "The unique identifier of the request (uuid)"
84+
},
85+
"sequence_id": {
86+
"type": "integer",
87+
"description": "Starts at 0 and increments for each message the server sends to the client.",
88+
"minimum": 0
89+
},
90+
"event": {
91+
"type": "string",
92+
"description": "The type of event being reported.",
93+
"enum": [
94+
"Update",
95+
"StartOfTurn",
96+
"EagerEndOfTurn",
97+
"TurnResumed",
98+
"EndOfTurn"
99+
]
100+
},
101+
"turn_index": {
102+
"type": "integer",
103+
"description": "The index of the current turn",
104+
"minimum": 0
105+
},
106+
"audio_window_start": {
107+
"type": "number",
108+
"description": "Start time in seconds of the audio range that was transcribed"
109+
},
110+
"audio_window_end": {
111+
"type": "number",
112+
"description": "End time in seconds of the audio range that was transcribed"
113+
},
114+
"transcript": {
115+
"type": "string",
116+
"description": "Text that was said over the course of the current turn"
117+
},
118+
"words": {
119+
"type": "array",
120+
"description": "The words in the transcript",
121+
"items": {
122+
"type": "object",
123+
"required": [
124+
"word",
125+
"confidence"
126+
],
127+
"properties": {
128+
"word": {
129+
"type": "string",
130+
"description": "The individual punctuated, properly-cased word from the transcript"
131+
},
132+
"confidence": {
133+
"type": "number",
134+
"description": "Confidence that this word was transcribed correctly"
135+
}
136+
}
137+
}
131138
},
132-
"confidence": {
133-
"type": "number",
134-
"description": "Confidence that this word was transcribed correctly"
139+
"end_of_turn_confidence": {
140+
"type": "number",
141+
"description": "Confidence that no more speech is coming in this turn"
135142
}
136-
}
137143
}
138-
},
139-
"end_of_turn_confidence": {
140-
"type": "number",
141-
"description": "Confidence that no more speech is coming in this turn"
142-
}
143144
}
144-
}
145145
}
146146
}

0 commit comments

Comments
 (0)