Skip to content

Commit c12c88a

Browse files
authored
Adds the usage stats to all Text Gen models (#19492)
1 parent 06fa002 commit c12c88a

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

42 files changed

+888
-0
lines changed

src/content/workers-ai-models/deepseek-coder-6.7b-base-awq.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/deepseek-coder-6.7b-instruct-awq.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/deepseek-math-7b-instruct.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -357,6 +357,27 @@
357357
"type": "string",
358358
"description": "The generated text response from the model"
359359
},
360+
"usage": {
361+
"type": "object",
362+
"description": "Usage statistics for the inference request",
363+
"properties": {
364+
"prompt_tokens": {
365+
"type": "number",
366+
"description": "Total number of tokens in input",
367+
"default": 0
368+
},
369+
"completion_tokens": {
370+
"type": "number",
371+
"description": "Total number of tokens in output",
372+
"default": 0
373+
},
374+
"total_tokens": {
375+
"type": "number",
376+
"description": "Total number of input and output tokens",
377+
"default": 0
378+
}
379+
}
380+
},
360381
"tool_calls": {
361382
"type": "array",
362383
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/discolm-german-7b-v1-awq.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/falcon-7b-instruct.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/gemma-2b-it-lora.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/gemma-7b-it-lora.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/gemma-7b-it.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -373,6 +373,27 @@
373373
"type": "string",
374374
"description": "The generated text response from the model"
375375
},
376+
"usage": {
377+
"type": "object",
378+
"description": "Usage statistics for the inference request",
379+
"properties": {
380+
"prompt_tokens": {
381+
"type": "number",
382+
"description": "Total number of tokens in input",
383+
"default": 0
384+
},
385+
"completion_tokens": {
386+
"type": "number",
387+
"description": "Total number of tokens in output",
388+
"default": 0
389+
},
390+
"total_tokens": {
391+
"type": "number",
392+
"description": "Total number of input and output tokens",
393+
"default": 0
394+
}
395+
}
396+
},
376397
"tool_calls": {
377398
"type": "array",
378399
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/hermes-2-pro-mistral-7b.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -357,6 +357,27 @@
357357
"type": "string",
358358
"description": "The generated text response from the model"
359359
},
360+
"usage": {
361+
"type": "object",
362+
"description": "Usage statistics for the inference request",
363+
"properties": {
364+
"prompt_tokens": {
365+
"type": "number",
366+
"description": "Total number of tokens in input",
367+
"default": 0
368+
},
369+
"completion_tokens": {
370+
"type": "number",
371+
"description": "Total number of tokens in output",
372+
"default": 0
373+
},
374+
"total_tokens": {
375+
"type": "number",
376+
"description": "Total number of input and output tokens",
377+
"default": 0
378+
}
379+
}
380+
},
360381
"tool_calls": {
361382
"type": "array",
362383
"description": "An array of tool calls requests made during the response generation",

src/content/workers-ai-models/llama-2-13b-chat-awq.json

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -353,6 +353,27 @@
353353
"type": "string",
354354
"description": "The generated text response from the model"
355355
},
356+
"usage": {
357+
"type": "object",
358+
"description": "Usage statistics for the inference request",
359+
"properties": {
360+
"prompt_tokens": {
361+
"type": "number",
362+
"description": "Total number of tokens in input",
363+
"default": 0
364+
},
365+
"completion_tokens": {
366+
"type": "number",
367+
"description": "Total number of tokens in output",
368+
"default": 0
369+
},
370+
"total_tokens": {
371+
"type": "number",
372+
"description": "Total number of input and output tokens",
373+
"default": 0
374+
}
375+
}
376+
},
356377
"tool_calls": {
357378
"type": "array",
358379
"description": "An array of tool calls requests made during the response generation",

0 commit comments

Comments (0)