|
11 | 11 | "created_at": "2024-12-06 17:09:18.338", |
12 | 12 | "tags": [], |
13 | 13 | "properties": [ |
| 14 | + { |
| 15 | + "property_id": "async_queue", |
| 16 | + "value": "true" |
| 17 | + }, |
14 | 18 | { |
15 | 19 | "property_id": "context_window", |
16 | 20 | "value": "24000" |
|
30 | 34 | } |
31 | 35 | ] |
32 | 36 | }, |
| 37 | + { |
| 38 | + "property_id": "function_calling", |
| 39 | + "value": "true" |
| 40 | + }, |
| 41 | + { |
| 42 | + "property_id": "lora", |
| 43 | + "value": "true" |
| 44 | + }, |
33 | 45 | { |
34 | 46 | "property_id": "terms", |
35 | 47 | "value": "https://github.com/meta-llama/llama-models/blob/main/models/llama3_3/LICENSE" |
|
53 | 65 | }, |
54 | 66 | "response_format": { |
55 | 67 | "title": "JSON Mode", |
56 | | - "type": "object", |
57 | 68 | "properties": { |
58 | 69 | "type": { |
59 | 70 | "type": "string", |
|
65 | 76 | "json_schema": {} |
66 | 77 | } |
67 | 78 | }, |
| 79 | + "guided_json": { |
| 80 | + "type": "object", |
| 81 | + "description": "JSON schema that should be fulfilled for the response." |
| 82 | + }, |
68 | 83 | "raw": { |
69 | 84 | "type": "boolean", |
70 | 85 | "default": false, |
|
82 | 97 | }, |
83 | 98 | "temperature": { |
84 | 99 | "type": "number", |
85 | | - "default": 0.6, |
| 100 | + "default": 0.15, |
86 | 101 | "minimum": 0, |
87 | 102 | "maximum": 5, |
88 | 103 | "description": "Controls the randomness of the output; higher values produce more random results." |
|
141 | 156 | "type": "string", |
142 | 157 | "description": "The role of the message sender (e.g., 'user', 'assistant', 'system', 'tool')." |
143 | 158 | }, |
144 | | - "content": { |
| 159 | + "tool_call_id": { |
145 | 160 | "type": "string", |
146 | | - "description": "The content of the message as a string." |
| 161 | + "description": "The tool call id. Must be supplied for tool calls for Mistral-3. If you don't know what to put here, you can fall back to '000000001'.", |
| 162 | + "pattern": "[a-zA-Z0-9]{9}" |
| 163 | + }, |
| 164 | + "content": { |
| 165 | + "oneOf": [ |
| 166 | + { |
| 167 | + "type": "string", |
| 168 | + "description": "The content of the message as a string." |
| 169 | + }, |
| 170 | + { |
| 171 | + "type": "array", |
| 172 | + "items": { |
| 173 | + "type": "object", |
| 174 | + "properties": { |
| 175 | + "type": { |
| 176 | + "type": "string", |
| 177 | + "description": "Type of the content provided" |
| 178 | + }, |
| 179 | + "text": { |
| 180 | + "type": "string" |
| 181 | + }, |
| 182 | + "image_url": { |
| 183 | + "type": "object", |
| 184 | + "properties": { |
| 185 | + "url": { |
| 186 | + "type": "string", |
| 187 | + "pattern": "^data:*", |
| 188 | + "description": "image uri with data (e.g. ...). HTTP URL will not be accepted" |
| 189 | + } |
| 190 | + } |
| 191 | + } |
| 192 | + } |
| 193 | + } |
| 194 | + }, |
| 195 | + { |
| 196 | + "type": "object", |
| 197 | + "properties": { |
| 198 | + "type": { |
| 199 | + "type": "string", |
| 200 | + "description": "Type of the content provided" |
| 201 | + }, |
| 202 | + "text": { |
| 203 | + "type": "string" |
| 204 | + }, |
| 205 | + "image_url": { |
| 206 | + "type": "object", |
| 207 | + "properties": { |
| 208 | + "url": { |
| 209 | + "type": "string", |
| 210 | + "pattern": "^data:*", |
| 211 | + "description": "image uri with data (e.g. ...). HTTP URL will not be accepted" |
| 212 | + } |
| 213 | + } |
| 214 | + } |
| 215 | + } |
| 216 | + } |
| 217 | + ] |
147 | 218 | } |
148 | | - }, |
149 | | - "required": [ |
150 | | - "role", |
151 | | - "content" |
152 | | - ] |
| 219 | + } |
153 | 220 | } |
154 | 221 | }, |
155 | 222 | "functions": { |
|
313 | 380 | }, |
314 | 381 | "response_format": { |
315 | 382 | "title": "JSON Mode", |
316 | | - "type": "object", |
317 | 383 | "properties": { |
318 | 384 | "type": { |
319 | 385 | "type": "string", |
|
325 | 391 | "json_schema": {} |
326 | 392 | } |
327 | 393 | }, |
| 394 | + "guided_json": { |
| 395 | + "type": "object", |
| 396 | + "description": "JSON schema that should be fulfilled for the response." |
| 397 | + }, |
328 | 398 | "raw": { |
329 | 399 | "type": "boolean", |
330 | 400 | "default": false, |
|
342 | 412 | }, |
343 | 413 | "temperature": { |
344 | 414 | "type": "number", |
345 | | - "default": 0.6, |
| 415 | + "default": 0.15, |
346 | 416 | "minimum": 0, |
347 | 417 | "maximum": 5, |
348 | 418 | "description": "Controls the randomness of the output; higher values produce more random results." |
|
387 | 457 | "required": [ |
388 | 458 | "messages" |
389 | 459 | ] |
| 460 | + }, |
| 461 | + { |
| 462 | + "type": "object", |
| 463 | + "properties": { |
| 464 | + "requests": { |
| 465 | + "type": "array", |
| 466 | + "items": { |
| 467 | + "type": "object", |
| 468 | + "properties": { |
| 469 | + "external_reference": { |
| 470 | + "type": "string", |
| 471 | + "description": "User-supplied reference. This field will also be present in the response, so it can be used to match the request with its response. It's NOT validated to be unique." |
| 472 | + }, |
| 473 | + "prompt": { |
| 474 | + "type": "string", |
| 475 | + "minLength": 1, |
| 476 | + "description": "Prompt for the text generation model" |
| 477 | + }, |
| 478 | + "stream": { |
| 479 | + "type": "boolean", |
| 480 | + "default": false, |
| 481 | + "description": "If true, the response will be streamed back incrementally using SSE, Server Sent Events." |
| 482 | + }, |
| 483 | + "max_tokens": { |
| 484 | + "type": "integer", |
| 485 | + "default": 256, |
| 486 | + "description": "The maximum number of tokens to generate in the response." |
| 487 | + }, |
| 488 | + "temperature": { |
| 489 | + "type": "number", |
| 490 | + "default": 0.6, |
| 491 | + "minimum": 0, |
| 492 | + "maximum": 5, |
| 493 | + "description": "Controls the randomness of the output; higher values produce more random results." |
| 494 | + }, |
| 495 | + "top_p": { |
| 496 | + "type": "number", |
| 497 | + "minimum": 0, |
| 498 | + "maximum": 2, |
| 499 | + "description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses." |
| 500 | + }, |
| 501 | + "seed": { |
| 502 | + "type": "integer", |
| 503 | + "minimum": 1, |
| 504 | + "maximum": 9999999999, |
| 505 | + "description": "Random seed for reproducibility of the generation." |
| 506 | + }, |
| 507 | + "repetition_penalty": { |
| 508 | + "type": "number", |
| 509 | + "minimum": 0, |
| 510 | + "maximum": 2, |
| 511 | + "description": "Penalty for repeated tokens; higher values discourage repetition." |
| 512 | + }, |
| 513 | + "frequency_penalty": { |
| 514 | + "type": "number", |
| 515 | + "minimum": 0, |
| 516 | + "maximum": 2, |
| 517 | + "description": "Decreases the likelihood of the model repeating the same lines verbatim." |
| 518 | + }, |
| 519 | + "presence_penalty": { |
| 520 | + "type": "number", |
| 521 | + "minimum": 0, |
| 522 | + "maximum": 2, |
| 523 | + "description": "Increases the likelihood of the model introducing new topics." |
| 524 | + }, |
| 525 | + "response_format": { |
| 526 | + "title": "JSON Mode", |
| 527 | + "type": "object", |
| 528 | + "properties": { |
| 529 | + "type": { |
| 530 | + "type": "string", |
| 531 | + "enum": [ |
| 532 | + "json_object", |
| 533 | + "json_schema" |
| 534 | + ] |
| 535 | + }, |
| 536 | + "json_schema": {} |
| 537 | + } |
| 538 | + } |
| 539 | + } |
| 540 | + } |
| 541 | + } |
| 542 | + }, |
| 543 | + "required": [ |
| 544 | + "requests" |
| 545 | + ] |
390 | 546 | } |
391 | 547 | ] |
392 | 548 | }, |
393 | 549 | "output": { |
394 | 550 | "oneOf": [ |
395 | 551 | { |
396 | 552 | "type": "object", |
| 553 | + "contentType": "application/json", |
397 | 554 | "properties": { |
398 | 555 | "response": { |
399 | 556 | "type": "string", |
|
444 | 601 | }, |
445 | 602 | { |
446 | 603 | "type": "string", |
| 604 | + "contentType": "text/event-stream", |
447 | 605 | "format": "binary" |
| 606 | + }, |
| 607 | + { |
| 608 | + "type": "object", |
| 609 | + "contentType": "application/json", |
| 610 | + "title": "Async response", |
| 611 | + "properties": { |
| 612 | + "request_id": { |
| 613 | + "type": "string", |
| 614 | + "description": "The async request id that can be used to obtain the results." |
| 615 | + } |
| 616 | + } |
448 | 617 | } |
449 | 618 | ] |
450 | 619 | } |
|
0 commit comments