diff --git a/src/content/workers-ai-models/falcon-7b-instruct.json b/src/content/workers-ai-models/falcon-7b-instruct.json index 1bfd7a84753d660..db373d9e1e4e84b 100644 --- a/src/content/workers-ai-models/falcon-7b-instruct.json +++ b/src/content/workers-ai-models/falcon-7b-instruct.json @@ -78,8 +78,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -102,13 +102,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -338,8 +338,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -362,13 +362,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/gemma-7b-it-lora.json b/src/content/workers-ai-models/gemma-7b-it-lora.json index 2a30cda85aa955d..f8858fa2cbe5368 100644 --- a/src/content/workers-ai-models/gemma-7b-it-lora.json +++ b/src/content/workers-ai-models/gemma-7b-it-lora.json @@ -78,8 +78,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -102,13 +102,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -338,8 +338,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -362,13 +362,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/hermes-2-pro-mistral-7b.json b/src/content/workers-ai-models/hermes-2-pro-mistral-7b.json index 9ec4c47011678ab..9a2ec4100f9c27c 100644 --- a/src/content/workers-ai-models/hermes-2-pro-mistral-7b.json +++ b/src/content/workers-ai-models/hermes-2-pro-mistral-7b.json @@ -82,8 +82,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -106,13 +106,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -342,8 +342,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -366,13 +366,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/llama-3.1-8b-instruct-fp8.json b/src/content/workers-ai-models/llama-3.1-8b-instruct-fp8.json index 8b0c68c21b0d420..d7f3a268edef747 100644 --- a/src/content/workers-ai-models/llama-3.1-8b-instruct-fp8.json +++ b/src/content/workers-ai-models/llama-3.1-8b-instruct-fp8.json @@ -89,8 +89,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -113,13 +113,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -349,8 +349,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -373,13 +373,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json b/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json index c02a03c1aeddd3f..b7935e245d93ea5 100644 --- a/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json +++ b/src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json @@ -487,13 +487,27 @@ "items": { "type": "object", "properties": { - "arguments": { - "type": "object", - "description": "The arguments passed to be passed to the tool call request" + "id": { + "type": "string", + "description": "The tool call id." }, - "name": { + "type": { "type": "string", - "description": "The name of the tool to be called" + "description": "Specifies the type of tool (e.g., 'function')." + }, + "function": { + "type": "object", + "description": "Details of the function tool.", + "properties": { + "name": { + "type": "string", + "description": "The name of the tool to be called" + }, + "arguments": { + "type": "object", + "description": "The arguments to be passed to the tool call request" + } + } } } } diff --git a/src/content/workers-ai-models/llava-1.5-7b-hf.json b/src/content/workers-ai-models/llava-1.5-7b-hf.json index 6547708f60747b6..ac627be9905e961 100644 --- a/src/content/workers-ai-models/llava-1.5-7b-hf.json +++ b/src/content/workers-ai-models/llava-1.5-7b-hf.json @@ -27,6 +27,23 @@ { "type": "object", "properties": { + "image": { + "oneOf": [ + { + "type": "array", + "description": "An array of integers that represent the image data constrained to 8-bit unsigned integer values", + "items": { + "type": "number", + "description": "A value between 0 and 255" + } + }, + { + "type": "string", + "format": "binary", + "description": "Binary string representing the image contents." + } + ] + }, "temperature": { "type": "number", "description": "Controls the randomness of the output; higher values produce more random results." 
@@ -64,23 +81,6 @@ "type": "number", "description": "Increases the likelihood of the model introducing new topics." }, - "image": { - "oneOf": [ - { - "type": "array", - "description": "An array of integers that represent the image data constrained to 8-bit unsigned integer values", - "items": { - "type": "number", - "description": "A value between 0 and 255" - } - }, - { - "type": "string", - "format": "binary", - "description": "Binary string representing the image contents." - } - ] - }, "max_tokens": { "type": "integer", "default": 512, diff --git a/src/content/workers-ai-models/meta-llama-3-8b-instruct.json b/src/content/workers-ai-models/meta-llama-3-8b-instruct.json index 49640a8463fc4c9..3f4111feb172bae 100644 --- a/src/content/workers-ai-models/meta-llama-3-8b-instruct.json +++ b/src/content/workers-ai-models/meta-llama-3-8b-instruct.json @@ -70,8 +70,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -94,13 +94,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -330,8 +330,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." 
}, "top_k": { @@ -354,13 +354,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } diff --git a/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json b/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json index dd292029d48b9ae..37eca190cdf7610 100644 --- a/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json +++ b/src/content/workers-ai-models/neural-chat-7b-v3-1-awq.json @@ -74,8 +74,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -98,13 +98,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -334,8 +334,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -358,13 +358,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." 
}, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } diff --git a/src/content/workers-ai-models/starling-lm-7b-beta.json b/src/content/workers-ai-models/starling-lm-7b-beta.json index aaa9a30baa43d96..7c27f83a3213862 100644 --- a/src/content/workers-ai-models/starling-lm-7b-beta.json +++ b/src/content/workers-ai-models/starling-lm-7b-beta.json @@ -90,8 +90,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -114,13 +114,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -350,8 +350,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -374,13 +374,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json b/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json index ff07059d568a74a..d112df35440f07d 100644 --- a/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json +++ b/src/content/workers-ai-models/una-cybertron-7b-v2-bf16.json @@ -74,8 +74,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -98,13 +98,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." } @@ -334,8 +334,8 @@ }, "top_p": { "type": "number", - "minimum": 0, - "maximum": 2, + "minimum": 0.001, + "maximum": 1, "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." }, "top_k": { @@ -358,13 +358,13 @@ }, "frequency_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Decreases the likelihood of the model repeating the same lines verbatim." }, "presence_penalty": { "type": "number", - "minimum": 0, + "minimum": -2, "maximum": 2, "description": "Increases the likelihood of the model introducing new topics." 
} diff --git a/src/content/workers-ai-models/whisper-large-v3-turbo.json b/src/content/workers-ai-models/whisper-large-v3-turbo.json index d440851ed2ef149..ed901fe3c8a210f 100644 --- a/src/content/workers-ai-models/whisper-large-v3-turbo.json +++ b/src/content/workers-ai-models/whisper-large-v3-turbo.json @@ -37,7 +37,6 @@ }, "language": { "type": "string", - "default": "en", "description": "The language of the audio being transcribed or translated." }, "vad_filter": {