new models and pricing page

mchenco · mchenco · commit b962301d9d6c · 2025-03-17T14:53:45.000-04:00
diff --git a/src/content/docs/workers-ai/platform/pricing.mdx b/src/content/docs/workers-ai/platform/pricing.mdx
@@ -55,6 +55,10 @@ Neurons are our way of measuring AI outputs across different models, representin
 | @cf/baai/bge-small-en-v1.5            | $0.020 per M input tokens                                  | 1841 neurons per M input tokens                                          |
 | @cf/baai/bge-base-en-v1.5             | $0.067 per M input tokens                                  | 6058 neurons per M input tokens                                          |
 | @cf/baai/bge-large-en-v1.5            | $0.204 per M input tokens                                  | 18582 neurons per M input tokens                                         |
+|@cf/baai/bge-m3                  |$0.012 per M input tokens|1075 neurons per M input tokens  |
+|@cf/baai/bge-reranker-base       |$0.003 per M input tokens|283 neurons per M input tokens   |
 | @cf/meta/m2m100-1.2b                  | $0.342 per M input tokens <br/> $0.342 per M output tokens | 31050 neurons per M input tokens <br/> 31050 neurons per M output tokens |
 | @cf/microsoft/resnet-50               | $2.51 per M images                                         | 228055 neurons per M images                                              |
 | @cf/openai/whisper                    | $0.0005 per audio minute                                   | 41.14 neurons per audio minute                                           |
+|@cf/openai/whisper-large-v3-turbo|$0.0005 per audio minute |46.63 neurons per audio minute   |
+|@cf/myshell-ai/melotts           |$3.416 per M input tokens|310577 neurons per M input tokens|
diff --git a/src/content/workers-ai-models/bge-m3.json b/src/content/workers-ai-models/bge-m3.json
@@ -0,0 +1,14 @@
+{
+    "id": "eed32bc1-8775-4985-89ce-dd1405508ad8",
+    "source": 1,
+    "name": "@cf/baai/bge-m3",
+    "description": "Multi-Functionality, Multi-Linguality, and Multi-Granularity embeddings model.",
+    "task": {
+        "id": "0137cdcf-162a-4108-94f2-1ca59e8c65ee",
+        "name": "Text Embeddings",
+        "description": "Feature extraction models transform raw data into numerical features that can be processed while preserving the information in the original dataset. These models are ideal as part of building vector search applications or Retrieval Augmented Generation workflows with Large Language Models (LLM)."
+    },
+    "tags": [],
+    "properties": [],
+    "schema": {}
+}
diff --git a/src/content/workers-ai-models/bge-reranker-base.json b/src/content/workers-ai-models/bge-reranker-base.json
@@ -0,0 +1,14 @@
+{
+    "id": "145337e7-cec3-4ebb-8e78-16ddfc75e580",
+    "source": 1,
+    "name": "@cf/baai/bge-reranker-base",
+    "description": "Unlike an embedding model, a reranker takes a question and a document as input and directly outputs a similarity score instead of an embedding. You can get a relevance score by passing a query and a passage to the reranker, and the score can be mapped to a float value in [0,1] by a sigmoid function.",
+    "task": {
+        "id": "19606750-23ed-4371-aab2-c20349b53a60",
+        "name": "Text Classification",
+        "description": "Sentiment analysis or text classification is a common NLP task that classifies a text input into labels or classes."
+    },
+    "tags": [],
+    "properties": [],
+    "schema": {}
+}
diff --git a/src/content/workers-ai-models/llama-3.2-1b-instruct.json b/src/content/workers-ai-models/llama-3.2-1b-instruct.json
@@ -12,7 +12,7 @@
     "properties": [
         {
             "property_id": "context_window",
-            "value": "128000"
+            "value": "60000"
         },
         {
             "property_id": "terms",
diff --git a/src/content/workers-ai-models/llama-guard-3-8b.json b/src/content/workers-ai-models/llama-guard-3-8b.json
@@ -21,12 +21,14 @@
                         "type": "object",
                         "properties": {
                             "role": {
-                                "type": "string",
-                                "description": "The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool')."
+                                "enum": [
+                                    "user",
+                                    "assistant"
+                                ],
+                                "description": "The role of the message sender must alternate between 'user' and 'assistant'."
                             },
                             "content": {
                                 "type": "string",
-                                "maxLength": 131072,
                                 "description": "The content of the message as a string."
                             }
                         },
diff --git a/src/content/workers-ai-models/whisper-large-v3-turbo.json b/src/content/workers-ai-models/whisper-large-v3-turbo.json
@@ -9,12 +9,7 @@
         "description": "Automatic speech recognition (ASR) models convert a speech signal, typically an audio input, to text."
     },
     "tags": [],
-    "properties": [
-        {
-            "property_id": "beta",
-            "value": "true"
-        }
-    ],
+    "properties": [],
     "schema": {
         "input": {
             "type": "object",
@@ -44,7 +39,7 @@
                 },
                 "prefix": {
                     "type": "string",
-                    "description": "The prefix it appended the beginning of the output of the transcription and can guide the transcription result."
+                    "description": "The prefix is appended to the beginning of the output of the transcription and can guide the transcription result."
                 }
             },
             "required": [
@@ -85,52 +80,55 @@
                     "description": "The total number of words in the transcription."
                 },
                 "segments": {
-                    "type": "object",
-                    "properties": {
-                        "start": {
-                            "type": "number",
-                            "description": "The starting time of the segment within the audio, in seconds."
-                        },
-                        "end": {
-                            "type": "number",
-                            "description": "The ending time of the segment within the audio, in seconds."
-                        },
-                        "text": {
-                            "type": "string",
-                            "description": "The transcription of the segment."
-                        },
-                        "temperature": {
-                            "type": "number",
-                            "description": "The temperature used in the decoding process, controlling randomness in predictions. Lower values result in more deterministic outputs."
-                        },
-                        "avg_logprob": {
-                            "type": "number",
-                            "description": "The average log probability of the predictions for the words in this segment, indicating overall confidence."
-                        },
-                        "compression_ratio": {
-                            "type": "number",
-                            "description": "The compression ratio of the input to the output, measuring how much the text was compressed during the transcription process."
-                        },
-                        "no_speech_prob": {
-                            "type": "number",
-                            "description": "The probability that the segment contains no speech, represented as a decimal between 0 and 1."
-                        },
-                        "words": {
-                            "type": "array",
-                            "items": {
-                                "type": "object",
-                                "properties": {
-                                    "word": {
-                                        "type": "string",
-                                        "description": "The individual word transcribed from the audio."
-                                    },
-                                    "start": {
-                                        "type": "number",
-                                        "description": "The starting time of the word within the audio, in seconds."
-                                    },
-                                    "end": {
-                                        "type": "number",
-                                        "description": "The ending time of the word within the audio, in seconds."
+                    "type": "array",
+                    "items": {
+                        "type": "object",
+                        "properties": {
+                            "start": {
+                                "type": "number",
+                                "description": "The starting time of the segment within the audio, in seconds."
+                            },
+                            "end": {
+                                "type": "number",
+                                "description": "The ending time of the segment within the audio, in seconds."
+                            },
+                            "text": {
+                                "type": "string",
+                                "description": "The transcription of the segment."
+                            },
+                            "temperature": {
+                                "type": "number",
+                                "description": "The temperature used in the decoding process, controlling randomness in predictions. Lower values result in more deterministic outputs."
+                            },
+                            "avg_logprob": {
+                                "type": "number",
+                                "description": "The average log probability of the predictions for the words in this segment, indicating overall confidence."
+                            },
+                            "compression_ratio": {
+                                "type": "number",
+                                "description": "The compression ratio of the input to the output, measuring how much the text was compressed during the transcription process."
+                            },
+                            "no_speech_prob": {
+                                "type": "number",
+                                "description": "The probability that the segment contains no speech, represented as a decimal between 0 and 1."
+                            },
+                            "words": {
+                                "type": "array",
+                                "items": {
+                                    "type": "object",
+                                    "properties": {
+                                        "word": {
+                                            "type": "string",
+                                            "description": "The individual word transcribed from the audio."
+                                        },
+                                        "start": {
+                                            "type": "number",
+                                            "description": "The starting time of the word within the audio, in seconds."
+                                        },
+                                        "end": {
+                                            "type": "number",
+                                            "description": "The ending time of the word within the audio, in seconds."
+                                        }
                                     }
                                 }
                             }

Original file line number	Diff line number	Diff line change
`@@ -12,7 +12,7 @@`
`12`	`12`	`"properties": [`
`13`	`13`	`{`
`14`	`14`	`"property_id": "context_window",`
`15`		`- "value": "128000"`
	`15`	`+ "value": "60000"`
`16`	`16`	`},`
`17`	`17`	`{`
`18`	`18`	`"property_id": "terms",`