Skip to content

Commit 8759297

Browse files
authored
[Workers AI] Model updates (#23079)
1 parent a960a3a commit 8759297

11 files changed

+100
-87
lines changed

src/content/workers-ai-models/falcon-7b-instruct.json

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -78,8 +78,8 @@
7878
},
7979
"top_p": {
8080
"type": "number",
81-
"minimum": 0,
82-
"maximum": 2,
81+
"minimum": 0.001,
82+
"maximum": 1,
8383
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
8484
},
8585
"top_k": {
@@ -102,13 +102,13 @@
102102
},
103103
"frequency_penalty": {
104104
"type": "number",
105-
"minimum": 0,
105+
"minimum": -2,
106106
"maximum": 2,
107107
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
108108
},
109109
"presence_penalty": {
110110
"type": "number",
111-
"minimum": 0,
111+
"minimum": -2,
112112
"maximum": 2,
113113
"description": "Increases the likelihood of the model introducing new topics."
114114
}
@@ -338,8 +338,8 @@
338338
},
339339
"top_p": {
340340
"type": "number",
341-
"minimum": 0,
342-
"maximum": 2,
341+
"minimum": 0.001,
342+
"maximum": 1,
343343
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
344344
},
345345
"top_k": {
@@ -362,13 +362,13 @@
362362
},
363363
"frequency_penalty": {
364364
"type": "number",
365-
"minimum": 0,
365+
"minimum": -2,
366366
"maximum": 2,
367367
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
368368
},
369369
"presence_penalty": {
370370
"type": "number",
371-
"minimum": 0,
371+
"minimum": -2,
372372
"maximum": 2,
373373
"description": "Increases the likelihood of the model introducing new topics."
374374
}

src/content/workers-ai-models/gemma-7b-it-lora.json

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -78,8 +78,8 @@
7878
},
7979
"top_p": {
8080
"type": "number",
81-
"minimum": 0,
82-
"maximum": 2,
81+
"minimum": 0.001,
82+
"maximum": 1,
8383
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
8484
},
8585
"top_k": {
@@ -102,13 +102,13 @@
102102
},
103103
"frequency_penalty": {
104104
"type": "number",
105-
"minimum": 0,
105+
"minimum": -2,
106106
"maximum": 2,
107107
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
108108
},
109109
"presence_penalty": {
110110
"type": "number",
111-
"minimum": 0,
111+
"minimum": -2,
112112
"maximum": 2,
113113
"description": "Increases the likelihood of the model introducing new topics."
114114
}
@@ -338,8 +338,8 @@
338338
},
339339
"top_p": {
340340
"type": "number",
341-
"minimum": 0,
342-
"maximum": 2,
341+
"minimum": 0.001,
342+
"maximum": 1,
343343
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
344344
},
345345
"top_k": {
@@ -362,13 +362,13 @@
362362
},
363363
"frequency_penalty": {
364364
"type": "number",
365-
"minimum": 0,
365+
"minimum": -2,
366366
"maximum": 2,
367367
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
368368
},
369369
"presence_penalty": {
370370
"type": "number",
371-
"minimum": 0,
371+
"minimum": -2,
372372
"maximum": 2,
373373
"description": "Increases the likelihood of the model introducing new topics."
374374
}

src/content/workers-ai-models/hermes-2-pro-mistral-7b.json

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -82,8 +82,8 @@
8282
},
8383
"top_p": {
8484
"type": "number",
85-
"minimum": 0,
86-
"maximum": 2,
85+
"minimum": 0.001,
86+
"maximum": 1,
8787
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
8888
},
8989
"top_k": {
@@ -106,13 +106,13 @@
106106
},
107107
"frequency_penalty": {
108108
"type": "number",
109-
"minimum": 0,
109+
"minimum": -2,
110110
"maximum": 2,
111111
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
112112
},
113113
"presence_penalty": {
114114
"type": "number",
115-
"minimum": 0,
115+
"minimum": -2,
116116
"maximum": 2,
117117
"description": "Increases the likelihood of the model introducing new topics."
118118
}
@@ -342,8 +342,8 @@
342342
},
343343
"top_p": {
344344
"type": "number",
345-
"minimum": 0,
346-
"maximum": 2,
345+
"minimum": 0.001,
346+
"maximum": 1,
347347
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
348348
},
349349
"top_k": {
@@ -366,13 +366,13 @@
366366
},
367367
"frequency_penalty": {
368368
"type": "number",
369-
"minimum": 0,
369+
"minimum": -2,
370370
"maximum": 2,
371371
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
372372
},
373373
"presence_penalty": {
374374
"type": "number",
375-
"minimum": 0,
375+
"minimum": -2,
376376
"maximum": 2,
377377
"description": "Increases the likelihood of the model introducing new topics."
378378
}

src/content/workers-ai-models/llama-3.1-8b-instruct-fp8.json

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -89,8 +89,8 @@
8989
},
9090
"top_p": {
9191
"type": "number",
92-
"minimum": 0,
93-
"maximum": 2,
92+
"minimum": 0.001,
93+
"maximum": 1,
9494
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
9595
},
9696
"top_k": {
@@ -113,13 +113,13 @@
113113
},
114114
"frequency_penalty": {
115115
"type": "number",
116-
"minimum": 0,
116+
"minimum": -2,
117117
"maximum": 2,
118118
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
119119
},
120120
"presence_penalty": {
121121
"type": "number",
122-
"minimum": 0,
122+
"minimum": -2,
123123
"maximum": 2,
124124
"description": "Increases the likelihood of the model introducing new topics."
125125
}
@@ -349,8 +349,8 @@
349349
},
350350
"top_p": {
351351
"type": "number",
352-
"minimum": 0,
353-
"maximum": 2,
352+
"minimum": 0.001,
353+
"maximum": 1,
354354
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
355355
},
356356
"top_k": {
@@ -373,13 +373,13 @@
373373
},
374374
"frequency_penalty": {
375375
"type": "number",
376-
"minimum": 0,
376+
"minimum": -2,
377377
"maximum": 2,
378378
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
379379
},
380380
"presence_penalty": {
381381
"type": "number",
382-
"minimum": 0,
382+
"minimum": -2,
383383
"maximum": 2,
384384
"description": "Increases the likelihood of the model introducing new topics."
385385
}

src/content/workers-ai-models/llama-4-scout-17b-16e-instruct.json

Lines changed: 19 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -487,13 +487,27 @@
487487
"items": {
488488
"type": "object",
489489
"properties": {
490-
"arguments": {
491-
"type": "object",
492-
"description": "The arguments passed to be passed to the tool call request"
490+
"id": {
491+
"type": "string",
492+
"description": "The tool call id."
493493
},
494-
"name": {
494+
"type": {
495495
"type": "string",
496-
"description": "The name of the tool to be called"
496+
"description": "Specifies the type of tool (e.g., 'function')."
497+
},
498+
"function": {
499+
"type": "object",
500+
"description": "Details of the function tool.",
501+
"properties": {
502+
"name": {
503+
"type": "string",
504+
"description": "The name of the tool to be called"
505+
},
506+
"arguments": {
507+
"type": "object",
508+
"description": "The arguments passed to be passed to the tool call request"
509+
}
510+
}
497511
}
498512
}
499513
}

src/content/workers-ai-models/llava-1.5-7b-hf.json

Lines changed: 17 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,23 @@
2727
{
2828
"type": "object",
2929
"properties": {
30+
"image": {
31+
"oneOf": [
32+
{
33+
"type": "array",
34+
"description": "An array of integers that represent the image data constrained to 8-bit unsigned integer values",
35+
"items": {
36+
"type": "number",
37+
"description": "A value between 0 and 255"
38+
}
39+
},
40+
{
41+
"type": "string",
42+
"format": "binary",
43+
"description": "Binary string representing the image contents."
44+
}
45+
]
46+
},
3047
"temperature": {
3148
"type": "number",
3249
"description": "Controls the randomness of the output; higher values produce more random results."
@@ -64,23 +81,6 @@
6481
"type": "number",
6582
"description": "Increases the likelihood of the model introducing new topics."
6683
},
67-
"image": {
68-
"oneOf": [
69-
{
70-
"type": "array",
71-
"description": "An array of integers that represent the image data constrained to 8-bit unsigned integer values",
72-
"items": {
73-
"type": "number",
74-
"description": "A value between 0 and 255"
75-
}
76-
},
77-
{
78-
"type": "string",
79-
"format": "binary",
80-
"description": "Binary string representing the image contents."
81-
}
82-
]
83-
},
8484
"max_tokens": {
8585
"type": "integer",
8686
"default": 512,

src/content/workers-ai-models/meta-llama-3-8b-instruct.json

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -70,8 +70,8 @@
7070
},
7171
"top_p": {
7272
"type": "number",
73-
"minimum": 0,
74-
"maximum": 2,
73+
"minimum": 0.001,
74+
"maximum": 1,
7575
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
7676
},
7777
"top_k": {
@@ -94,13 +94,13 @@
9494
},
9595
"frequency_penalty": {
9696
"type": "number",
97-
"minimum": 0,
97+
"minimum": -2,
9898
"maximum": 2,
9999
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
100100
},
101101
"presence_penalty": {
102102
"type": "number",
103-
"minimum": 0,
103+
"minimum": -2,
104104
"maximum": 2,
105105
"description": "Increases the likelihood of the model introducing new topics."
106106
}
@@ -330,8 +330,8 @@
330330
},
331331
"top_p": {
332332
"type": "number",
333-
"minimum": 0,
334-
"maximum": 2,
333+
"minimum": 0.001,
334+
"maximum": 1,
335335
"description": "Adjusts the creativity of the AI's responses by controlling how many possible words it considers. Lower values make outputs more predictable; higher values allow for more varied and creative responses."
336336
},
337337
"top_k": {
@@ -354,13 +354,13 @@
354354
},
355355
"frequency_penalty": {
356356
"type": "number",
357-
"minimum": 0,
357+
"minimum": -2,
358358
"maximum": 2,
359359
"description": "Decreases the likelihood of the model repeating the same lines verbatim."
360360
},
361361
"presence_penalty": {
362362
"type": "number",
363-
"minimum": 0,
363+
"minimum": -2,
364364
"maximum": 2,
365365
"description": "Increases the likelihood of the model introducing new topics."
366366
}

0 commit comments

Comments
 (0)