Update bindings.mdx

thomasgauvin · web-flow · commit b2fc8e22f932 · 2025-01-18T15:27:53.000-05:00
diff --git a/src/content/docs/workers-ai/configuration/bindings.mdx b/src/content/docs/workers-ai/configuration/bindings.mdx
@@ -55,9 +55,57 @@ const answer = await env.AI.run('@cf/meta/llama-3.1-8b-instruct', {
 
   **Supported options**
 
+  * `prompt` <Type text="string" /> <MetaInfo text="optional" />
+    * Text prompt for the text-generation (maxLength: 131072, minLength: 1).
+  * `raw` <Type text="boolean" /> <MetaInfo text="optional" />
+    * If true, a chat template is not applied and you must adhere to the specific model's expected formatting.
   * `stream` <Type text="boolean" /> <MetaInfo text="optional" />
-    * Returns a stream of results as they are available.
-
+    * If true, the response will be streamed back incrementally using SSE, Server Sent Events.
+  * `max_tokens` <Type text="number" /> <MetaInfo text="optional" />
+    * The maximum number of tokens to generate in the response.
+  * `temperature` <Type text="number" /> <MetaInfo text="optional" />
+    * Controls the randomness of the output; higher values produce more random results (maximum: 5, minimum: 0).
+  * `top_p` <Type text="number" /> <MetaInfo text="optional" />
+    * Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses (maximum: 2, minimum: 0).
+  * `top_k` <Type text="number" /> <MetaInfo text="optional" />
+    * Limits the AI to choose from the top 'k' most probable words. Lower values make responses more focused; higher values introduce more variety and potential surprises (maximum: 50, minimum: 1).
+  * `seed` <Type text="number" /> <MetaInfo text="optional" />
+    * Random seed for reproducibility of the generation (maximum: 9999999999, minimum: 1).
+  * `repetition_penalty` <Type text="number" /> <MetaInfo text="optional" />
+    * Penalty for repeated tokens; higher values discourage repetition (maximum: 2, minimum: 0). 
+  * `frequency_penalty` <Type text="number" /> <MetaInfo text="optional" />
+    * Decreases the likelihood of the model repeating the same lines verbatim (maximum: 2, minimum: 0).
+  * `presence_penalty` <Type text="number" /> <MetaInfo text="optional" />
+    * Increases the likelihood of the model introducing new topics (maximum: 2, minimum: 0).
+  * `messages` <Type text="{
+  role: "user" | "assistant" | "system" | "tool" | (string & NonNullable<unknown>);
+  content: string;
+  name?: string;
+}[]" /> <MetaInfo text="optional" />
+    * An array of message objects representing the conversation history.
+  * `tools` <Type text="{
+  type: "function" | (string & NonNullable<unknown>);
+  function: {
+    name: string;
+    description: string;
+    parameters?: {
+      type: "object" | (string & NonNullable<unknown>);
+      properties: {
+        [key: string]: {
+          type: string;
+          description?: string;
+        };
+      };
+      required: string[];
+    };
+  };
+}[]" /> <MetaInfo text="optional" />
+    * A list of tools available for the assistant to use.
+  * `functions` <Type text="{
+  name: string;
+  code: string;
+}[]" /> <MetaInfo text="optional" />
+    * A list of functions available for the assistant to use.
 
 
 ```javascript