|
1492 | 1492 | "max_input_tokens": 131072, |
1493 | 1493 | "max_output_tokens": 32766, |
1494 | 1494 | "available_providers": [ |
1495 | | - "groq" |
| 1495 | + "groq", |
| 1496 | + "together" |
1496 | 1497 | ] |
1497 | 1498 | }, |
1498 | 1499 | "openai/gpt-oss-20b": { |
|
1506 | 1507 | "max_input_tokens": 131072, |
1507 | 1508 | "max_output_tokens": 32768, |
1508 | 1509 | "available_providers": [ |
1509 | | - "groq" |
| 1510 | + "groq", |
| 1511 | + "together" |
1510 | 1512 | ] |
1511 | 1513 | }, |
1512 | 1514 | "accounts/fireworks/models/gpt-oss-120b": { |
|
2924 | 2926 | "max_input_tokens": 1048576, |
2925 | 2927 | "max_output_tokens": 65536, |
2926 | 2928 | "available_providers": [ |
| 2929 | + "google", |
2927 | 2930 | "vertex" |
2928 | 2931 | ] |
2929 | 2932 | }, |
|
2940 | 2943 | "max_input_tokens": 1048576, |
2941 | 2944 | "max_output_tokens": 65536, |
2942 | 2945 | "available_providers": [ |
| 2946 | + "google", |
2943 | 2947 | "vertex" |
2944 | 2948 | ] |
2945 | 2949 | }, |
|
2956 | 2960 | "max_input_tokens": 1048576, |
2957 | 2961 | "max_output_tokens": 65536, |
2958 | 2962 | "available_providers": [ |
| 2963 | + "google", |
2959 | 2964 | "vertex" |
2960 | 2965 | ] |
2961 | 2966 | }, |
|
2969 | 2974 | "displayName": "Gemini 3 Pro (Preview)", |
2970 | 2975 | "reasoning": true, |
2971 | 2976 | "reasoning_budget": true, |
2972 | | - "deprecation_date": "2026-03-26", |
| 2977 | + "deprecation_date": "2026-03-09", |
2973 | 2978 | "max_input_tokens": 1048576, |
2974 | 2979 | "max_output_tokens": 65535, |
2975 | 2980 | "available_providers": [ |
| 2981 | + "google", |
2976 | 2982 | "vertex" |
2977 | 2983 | ] |
2978 | 2984 | }, |
|
2989 | 2995 | "max_input_tokens": 1048576, |
2990 | 2996 | "max_output_tokens": 65535, |
2991 | 2997 | "available_providers": [ |
2992 | | - "google" |
| 2998 | + "google", |
| 2999 | + "vertex" |
2993 | 3000 | ] |
2994 | 3001 | }, |
2995 | 3002 | "gemini-2.5-flash": { |
|
3005 | 3012 | "max_input_tokens": 1048576, |
3006 | 3013 | "max_output_tokens": 65535, |
3007 | 3014 | "available_providers": [ |
| 3015 | + "google", |
3008 | 3016 | "vertex" |
3009 | 3017 | ] |
3010 | 3018 | }, |
|
3021 | 3029 | "max_input_tokens": 1048576, |
3022 | 3030 | "max_output_tokens": 65535, |
3023 | 3031 | "available_providers": [ |
| 3032 | + "google", |
3024 | 3033 | "vertex" |
3025 | 3034 | ] |
3026 | 3035 | }, |
|
3038 | 3047 | "max_input_tokens": 1048576, |
3039 | 3048 | "max_output_tokens": 65535, |
3040 | 3049 | "available_providers": [ |
| 3050 | + "google", |
3041 | 3051 | "vertex" |
3042 | 3052 | ] |
3043 | 3053 | }, |
|
3164 | 3174 | "max_input_tokens": 1048576, |
3165 | 3175 | "max_output_tokens": 65535, |
3166 | 3176 | "available_providers": [ |
| 3177 | + "google", |
3167 | 3178 | "vertex" |
3168 | 3179 | ] |
3169 | 3180 | }, |
|
3183 | 3194 | "max_input_tokens": 1048576, |
3184 | 3195 | "max_output_tokens": 65535, |
3185 | 3196 | "available_providers": [ |
| 3197 | + "google", |
3186 | 3198 | "vertex" |
3187 | 3199 | ] |
3188 | 3200 | }, |
|
3199 | 3211 | "max_input_tokens": 1048576, |
3200 | 3212 | "max_output_tokens": 65535, |
3201 | 3213 | "available_providers": [ |
| 3214 | + "google", |
3202 | 3215 | "vertex" |
3203 | 3216 | ] |
3204 | 3217 | }, |
|
3214 | 3227 | "max_input_tokens": 1048576, |
3215 | 3228 | "max_output_tokens": 8192, |
3216 | 3229 | "available_providers": [ |
| 3230 | + "google", |
3217 | 3231 | "vertex" |
3218 | 3232 | ] |
3219 | 3233 | }, |
3220 | 3234 | "gemini-2.0-flash-001": { |
3221 | 3235 | "format": "google", |
3222 | 3236 | "flavor": "chat", |
3223 | 3237 | "multimodal": true, |
3224 | | - "input_cost_per_mil_tokens": 0.15, |
3225 | | - "output_cost_per_mil_tokens": 0.6, |
3226 | | - "input_cache_read_cost_per_mil_tokens": 0.0375, |
| 3238 | + "input_cost_per_mil_tokens": 0.1, |
| 3239 | + "output_cost_per_mil_tokens": 0.4, |
| 3240 | + "input_cache_read_cost_per_mil_tokens": 0.025, |
3227 | 3241 | "deprecation_date": "2026-06-01", |
3228 | 3242 | "parent": "gemini-2.0-flash", |
3229 | 3243 | "max_input_tokens": 1048576, |
3230 | 3244 | "max_output_tokens": 8192, |
3231 | 3245 | "available_providers": [ |
| 3246 | + "google", |
3232 | 3247 | "vertex" |
3233 | 3248 | ] |
3234 | 3249 | }, |
|
3244 | 3259 | "max_input_tokens": 1048576, |
3245 | 3260 | "max_output_tokens": 8192, |
3246 | 3261 | "available_providers": [ |
| 3262 | + "google", |
3247 | 3263 | "vertex" |
3248 | 3264 | ] |
3249 | 3265 | }, |
|
3259 | 3275 | "max_input_tokens": 1048576, |
3260 | 3276 | "max_output_tokens": 8192, |
3261 | 3277 | "available_providers": [ |
| 3278 | + "google", |
3262 | 3279 | "vertex" |
3263 | 3280 | ] |
3264 | 3281 | }, |
|
3272 | 3289 | "max_input_tokens": 65536, |
3273 | 3290 | "max_output_tokens": 32768, |
3274 | 3291 | "available_providers": [ |
| 3292 | + "google", |
3275 | 3293 | "vertex" |
3276 | 3294 | ] |
3277 | 3295 | }, |
|
3280 | 3298 | "flavor": "chat", |
3281 | 3299 | "multimodal": true, |
3282 | 3300 | "input_cost_per_mil_tokens": 0.075, |
3283 | | - "output_cost_per_mil_tokens": 0.3, |
| 3301 | + "output_cost_per_mil_tokens": 0, |
3284 | 3302 | "displayName": "Gemini 1.5 Flash", |
3285 | 3303 | "deprecation_date": "2025-09-29", |
3286 | | - "max_input_tokens": 1000000, |
| 3304 | + "max_input_tokens": 8192, |
3287 | 3305 | "max_output_tokens": 8192, |
3288 | 3306 | "available_providers": [ |
3289 | | - "vertex" |
| 3307 | + "google" |
3290 | 3308 | ] |
3291 | 3309 | }, |
3292 | 3310 | "gemini-1.5-flash-latest": { |
|
3488 | 3506 | "format": "google", |
3489 | 3507 | "flavor": "chat", |
3490 | 3508 | "multimodal": true, |
3491 | | - "input_cost_per_mil_tokens": 0, |
3492 | | - "output_cost_per_mil_tokens": 0, |
| 3509 | + "input_cost_per_mil_tokens": 0.3, |
| 3510 | + "output_cost_per_mil_tokens": 2.5, |
| 3511 | + "input_cache_read_cost_per_mil_tokens": 0.03, |
3493 | 3512 | "experimental": true, |
3494 | 3513 | "deprecated": true, |
3495 | | - "max_input_tokens": 2097152, |
3496 | | - "max_output_tokens": 8192, |
| 3514 | + "max_input_tokens": 1048576, |
| 3515 | + "max_output_tokens": 65535, |
3497 | 3516 | "available_providers": [ |
3498 | 3517 | "google" |
3499 | 3518 | ] |
|
6189 | 6208 | "azure" |
6190 | 6209 | ] |
6191 | 6210 | }, |
| 6211 | + "gpt-5.4-mini-2026-03-17": { |
| 6212 | + "format": "openai", |
| 6213 | + "flavor": "chat", |
| 6214 | + "multimodal": true, |
| 6215 | + "input_cost_per_mil_tokens": 0.75, |
| 6216 | + "output_cost_per_mil_tokens": 4.5, |
| 6217 | + "input_cache_read_cost_per_mil_tokens": 0.075, |
| 6218 | + "displayName": "GPT-5.4 mini (2026-03-17)", |
| 6219 | + "reasoning": true, |
| 6220 | + "parent": "gpt-5.4-mini", |
| 6221 | + "max_input_tokens": 400000, |
| 6222 | + "max_output_tokens": 128000, |
| 6223 | + "available_providers": [ |
| 6224 | + "openai", |
| 6225 | + "azure" |
| 6226 | + ] |
| 6227 | + }, |
6192 | 6228 | "gpt-5.4-nano": { |
6193 | 6229 | "format": "openai", |
6194 | 6230 | "flavor": "chat", |
|
0 commit comments