Skip to content

Commit 2074d71

Browse files
committed
Update LLM model examples
1 parent 9c0a237 commit 2074d71

File tree

1 file changed

+35
-35
lines changed

1 file changed

+35
-35
lines changed

app/_data/plugins/ai-proxy.yaml

Lines changed: 35 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -98,21 +98,21 @@ providers:
9898
streaming: true
9999
upstream_path: '/v1/messages'
100100
route_type: 'llm/v1/chat'
101-
model_example: 'claude-3-opus-20240229'
101+
model_example: 'claude-sonnet-4-20250514'
102102
min_version: '3.6'
103103
completions:
104104
supported: true
105105
streaming: false
106106
upstream_path: '/v1/complete'
107107
route_type: 'llm/v1/completions'
108-
model_example: 'claude-2.1'
108+
model_example: 'claude-sonnet-4-20250514'
109109
min_version: '3.6'
110110
function_calling:
111111
supported: true
112112
streaming: false
113113
upstream_path: '/v1/messages'
114114
route_type: 'llm/v1/chat'
115-
model_example: 'claude-3-opus-20240229'
115+
model_example: 'claude-sonnet-4-20250514'
116116
min_version: '3.6'
117117
batches:
118118
supported: true
@@ -143,30 +143,30 @@ providers:
143143
streaming: true
144144
upstream_path: '/openai/deployments/{deployment_name}/chat/completions'
145145
route_type: 'llm/v1/chat'
146-
model_example: 'gpt-4'
146+
model_example: 'gpt-4o'
147147
min_version: '3.6'
148148
completions:
149149
supported: true
150150
streaming: true
151151
upstream_path: '/openai/deployments/{deployment_name}/completions'
152152
route_type: 'llm/v1/completions'
153-
model_example: 'gpt-3.5-turbo-instruct'
153+
model_example: 'gpt-4o-mini'
154154
min_version: '3.6'
155155
embeddings:
156156
supported: true
157157
streaming: false
158158
upstream_path: '/openai/deployments/{deployment_name}/embeddings'
159159
route_type: 'llm/v1/embeddings'
160-
model_example: 'text-embedding-ada-002<sup>1</sup>'
160+
model_example: 'text-embedding-3-small'
161161
min_version: '3.11'
162162
note:
163-
content: 'The `text-embedding-ada-002` model requires a fixed dimension of 1536. Use `text-embedding-3-small` for dynamic dimensions.'
163+
content: 'Use `text-embedding-3-small` or `text-embedding-3-large` for dynamic dimensions.'
164164
function_calling:
165165
supported: true
166166
streaming: false
167167
upstream_path: '/openai/deployments/{deployment_name}/chat/completions'
168168
route_type: 'llm/v1/chat'
169-
model_example: 'gpt-4'
169+
model_example: 'gpt-4o'
170170
min_version: '3.6'
171171
files:
172172
supported: true
@@ -268,7 +268,7 @@ providers:
268268
streaming: true
269269
upstream_path: '/v1/chat/completions'
270270
route_type: 'llm/v1/chat'
271-
model_example: 'llama3.1-8b'
271+
model_example: 'llama-3.3-70b'
272272
min_version: '3.13'
273273
limitations:
274274
provider_specific: []
@@ -283,14 +283,14 @@ providers:
283283
streaming: true
284284
upstream_path: '/v1/chat'
285285
route_type: 'llm/v1/chat'
286-
model_example: 'command'
286+
model_example: 'command-a-03-2025'
287287
min_version: '3.6'
288288
completions:
289289
supported: true
290290
streaming: true
291291
upstream_path: '/v1/generate'
292292
route_type: 'llm/v1/completions'
293-
model_example: 'command'
293+
model_example: 'command-r-plus-08-2024'
294294
min_version: '3.6'
295295
embeddings:
296296
supported: true
@@ -304,7 +304,7 @@ providers:
304304
streaming: false
305305
upstream_path: '/v1/chat'
306306
route_type: 'llm/v1/chat'
307-
model_example: 'command-r-plus'
307+
model_example: 'command-a-03-2025'
308308
min_version: '3.6'
309309
native_formats:
310310
- llm_format: 'cohere'
@@ -362,7 +362,7 @@ providers:
362362
streaming: true
363363
upstream_path: 'Uses <code>generateContent</code> API'
364364
route_type: 'llm/v1/chat'
365-
model_example: 'gemini-2.0-flash'
365+
model_example: 'gemini-2.5-flash'
366366
min_version: '3.8'
367367
embeddings:
368368
supported: true
@@ -376,7 +376,7 @@ providers:
376376
streaming: false
377377
upstream_path: 'Uses <code>generateContent</code> API with function declarations'
378378
route_type: 'llm/v1/chat'
379-
model_example: 'gemini-2.0-flash'
379+
model_example: 'gemini-2.5-flash'
380380
min_version: '3.8'
381381
files:
382382
supported: true
@@ -402,21 +402,21 @@ providers:
402402
streaming: false
403403
upstream_path: 'Uses <code>generateContent</code> API'
404404
route_type: 'image/v1/images/generations'
405-
model_example: 'gemini-2.0-flash-preview-image-generation<sup>1</sup>'
405+
model_example: 'gemini-2.5-flash-preview-image-generation'
406406
min_version: '3.11'
407407
edits:
408408
supported: true
409409
streaming: false
410410
upstream_path: 'Uses <code>generateContent</code> API'
411411
route_type: 'image/v1/images/edits'
412-
model_example: 'gemini-2.0-flash-preview-image-generation<sup>1</sup>'
412+
model_example: 'gemini-2.5-flash-preview-image-generation'
413413
min_version: '3.11'
414414
realtime:
415415
supported: true
416416
streaming: true
417417
upstream_path: 'Uses <code>BidiGenerateContent</code> API'
418418
route_type: 'realtime/v1/realtime'
419-
model_example: 'gemini-live-2.5-flash-preview-native-audio-09-2025'
419+
model_example: 'gemini-2.5-flash-preview-native-audio'
420420
min_version: '3.13'
421421
note:
422422
content: 'Realtime processing for Gemini is supported in the native format from SDK only'
@@ -452,14 +452,14 @@ providers:
452452
streaming: true
453453
upstream_path: 'Uses <code>generateContent</code> API'
454454
route_type: 'llm/v1/chat'
455-
model_example: 'gemini-2.0-flash'
455+
model_example: 'gemini-2.5-flash'
456456
min_version: '3.8'
457457
completions:
458458
supported: true
459459
streaming: false
460460
upstream_path: 'Uses <code>generateContent</code> API'
461461
route_type: 'llm/v1/completions'
462-
model_example: 'gemini-2.0-flash'
462+
model_example: 'gemini-2.5-flash'
463463
min_version: '3.8'
464464
embeddings:
465465
supported: true
@@ -473,7 +473,7 @@ providers:
473473
streaming: false
474474
upstream_path: 'Uses <code>generateContent</code> API with function declarations'
475475
route_type: 'llm/v1/chat'
476-
model_example: 'gemini-2.0-flash'
476+
model_example: 'gemini-2.5-flash'
477477
min_version: '3.8'
478478
files:
479479
supported: true
@@ -497,14 +497,14 @@ providers:
497497
streaming: false
498498
upstream_path: 'Uses <code>generateContent</code> API'
499499
route_type: 'image/v1/images/generations'
500-
model_example: 'gemini-2.0-flash-preview-image-generation<sup>1</sup>'
500+
model_example: 'gemini-2.5-flash-preview-image-generation'
501501
min_version: '3.11'
502502
edits:
503503
supported: true
504504
streaming: false
505505
upstream_path: 'Uses <code>generateContent</code> API'
506506
route_type: 'image/v1/images/edits'
507-
model_example: 'gemini-2.0-flash-preview-image-generation<sup>1</sup>'
507+
model_example: 'gemini-2.5-flash-preview-image-generation'
508508
min_version: '3.11'
509509
video:
510510
generations:
@@ -606,7 +606,7 @@ providers:
606606
streaming: true
607607
upstream_path: '/v1/chat/completions or user-defined'
608608
route_type: 'llm/v1/chat'
609-
model_example: 'mistral-tiny'
609+
model_example: 'mistral-large-latest'
610610
min_version: '3.6'
611611
embeddings:
612612
supported: true
@@ -627,7 +627,7 @@ providers:
627627
statistics_logging: []
628628

629629
- name: 'OpenAI'
630-
formats: 'GPT-3.5, GPT-4, GPT-4o, and Multi-Modal'
630+
formats: 'GPT-4o, GPT-4.1, and Multi-Modal'
631631
url_patterns:
632632
- 'https://api.openai.com:443/{route_type_path}'
633633
min_version: '3.6'
@@ -636,30 +636,30 @@ providers:
636636
streaming: true
637637
upstream_path: '/v1/chat/completions'
638638
route_type: 'llm/v1/chat'
639-
model_example: 'gpt-4'
639+
model_example: 'gpt-4o'
640640
min_version: '3.6'
641641
completions:
642642
supported: true
643643
streaming: true
644644
upstream_path: '/v1/completions'
645645
route_type: 'llm/v1/completions'
646-
model_example: 'gpt-3.5-turbo-instruct'
646+
model_example: 'gpt-4o-mini'
647647
min_version: '3.6'
648648
embeddings:
649649
supported: true
650650
streaming: false
651651
upstream_path: '/v1/embeddings'
652652
route_type: 'llm/v1/embeddings'
653-
model_example: 'text-embedding-ada-002'
653+
model_example: 'text-embedding-3-small'
654654
min_version: '3.11'
655655
note:
656-
content: 'The `text-embedding-ada-002` model requires a fixed dimension of 1536. Use `text-embedding-3-small` for dynamic dimensions.'
656+
content: 'Use `text-embedding-3-small` or `text-embedding-3-large` for dynamic dimensions.'
657657
function_calling:
658658
supported: true
659659
streaming: false
660660
upstream_path: '/v1/chat/completions'
661661
route_type: 'llm/v1/chat'
662-
model_example: 'gpt-4'
662+
model_example: 'gpt-4o'
663663
min_version: '3.6'
664664
files:
665665
supported: true
@@ -680,7 +680,7 @@ providers:
680680
streaming: false
681681
upstream_path: '/v1/assistants'
682682
route_type: 'llm/v1/assistants'
683-
model_example: 'gpt-4-1106-preview'
683+
model_example: 'gpt-4o'
684684
min_version: '3.11'
685685
note:
686686
content: 'Requires header <code>OpenAI-Beta: assistants=v2</code>'
@@ -689,7 +689,7 @@ providers:
689689
streaming: false
690690
upstream_path: '/v1/responses'
691691
route_type: 'llm/v1/responses'
692-
model_example: 'gpt-4-1106-preview'
692+
model_example: 'gpt-4o'
693693
min_version: '3.11'
694694
audio:
695695
speech:
@@ -733,7 +733,7 @@ providers:
733733
streaming: true
734734
upstream_path: '/v1/realtime'
735735
route_type: 'realtime/v1/realtime'
736-
model_example: 'gpt-4o'
736+
model_example: 'gpt-4o-realtime-preview'
737737
min_version: '3.11'
738738
note:
739739
content: 'For requests to OpenAI realtime API, include the header `OpenAI-Beta: realtime=v1`.'
@@ -759,7 +759,7 @@ providers:
759759
streaming: false
760760
upstream_path: '/v1/chat/completions'
761761
route_type: 'llm/v1/chat'
762-
model_example: 'grok-4'
762+
model_example: 'grok-3'
763763
min_version: '3.13'
764764
completions:
765765
supported: false
@@ -772,7 +772,7 @@ providers:
772772
streaming: false
773773
upstream_path: '/v1/chat/completions'
774774
route_type: 'llm/v1/chat'
775-
model_example: 'grok-2-latest'
775+
model_example: 'grok-3'
776776
min_version: '3.13'
777777
files:
778778
supported: false
@@ -788,7 +788,7 @@ providers:
788788
streaming: false
789789
upstream_path: '/v1/responses'
790790
route_type: 'llm/v1/responses'
791-
model_example: 'gpt-4'
791+
model_example: 'grok-3'
792792
min_version: '3.13'
793793
audio:
794794
speech:

0 commit comments

Comments
 (0)