Skip to content

Commit 7ead1f5

Browse files
committed
Merge branch 'main' into 04-01-native_inference_billing
2 parents d3880ec + df467d0 commit 7ead1f5

File tree

5 files changed: +228 additions, -130 deletions

.github/workflows/enforce-pnpm.yml

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,17 @@
1+
name: Enforce pnpm
2+
3+
on:
4+
pull_request:
5+
push:
6+
7+
jobs:
8+
reject-npm-lockfile:
9+
runs-on: ubuntu-latest
10+
steps:
11+
- uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
12+
- name: Reject npm lockfiles
13+
run: |
14+
if git ls-files | grep -E '(^|/)package-lock\.json$'; then
15+
echo "Remove package-lock.json and use pnpm."
16+
exit 1
17+
fi

.npmrc

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1 +1,2 @@
11
min-release-age=3
2+
engine-strict=true

package.json

Lines changed: 13 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -7,13 +7,26 @@
77
"packages/*"
88
],
99
"scripts": {
10+
"preinstall": "node -e \"const userAgent = process.env.npm_config_user_agent || ''; if (process.env.INIT_CWD === process.cwd() && !userAgent.includes('pnpm/')) { console.error('Use pnpm in this repo.'); process.exit(1); }\"",
1011
"build": "turbo run build",
1112
"dev": "turbo run dev",
1213
"start": "turbo run start",
1314
"lint": "turbo run lint",
1415
"clean": "turbo run clean",
1516
"test": "vitest run"
1617
},
18+
"engines": {
19+
"pnpm": ">=10.27.0",
20+
"npm": "please-use-pnpm",
21+
"yarn": "please-use-pnpm"
22+
},
23+
"devEngines": {
24+
"packageManager": {
25+
"name": "pnpm",
26+
"version": ">=10.27.0",
27+
"onFail": "error"
28+
}
29+
},
1730
"devDependencies": {
1831
"eslint": "^8.57.1",
1932
"eslint-config-turbo": "latest",

packages/proxy/schema/model_list.json

Lines changed: 50 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -1492,7 +1492,8 @@
14921492
"max_input_tokens": 131072,
14931493
"max_output_tokens": 32766,
14941494
"available_providers": [
1495-
"groq"
1495+
"groq",
1496+
"together"
14961497
]
14971498
},
14981499
"openai/gpt-oss-20b": {
@@ -1506,7 +1507,8 @@
15061507
"max_input_tokens": 131072,
15071508
"max_output_tokens": 32768,
15081509
"available_providers": [
1509-
"groq"
1510+
"groq",
1511+
"together"
15101512
]
15111513
},
15121514
"accounts/fireworks/models/gpt-oss-120b": {
@@ -2924,6 +2926,7 @@
29242926
"max_input_tokens": 1048576,
29252927
"max_output_tokens": 65536,
29262928
"available_providers": [
2929+
"google",
29272930
"vertex"
29282931
]
29292932
},
@@ -2940,6 +2943,7 @@
29402943
"max_input_tokens": 1048576,
29412944
"max_output_tokens": 65536,
29422945
"available_providers": [
2946+
"google",
29432947
"vertex"
29442948
]
29452949
},
@@ -2956,6 +2960,7 @@
29562960
"max_input_tokens": 1048576,
29572961
"max_output_tokens": 65536,
29582962
"available_providers": [
2963+
"google",
29592964
"vertex"
29602965
]
29612966
},
@@ -2969,10 +2974,11 @@
29692974
"displayName": "Gemini 3 Pro (Preview)",
29702975
"reasoning": true,
29712976
"reasoning_budget": true,
2972-
"deprecation_date": "2026-03-26",
2977+
"deprecation_date": "2026-03-09",
29732978
"max_input_tokens": 1048576,
29742979
"max_output_tokens": 65535,
29752980
"available_providers": [
2981+
"google",
29762982
"vertex"
29772983
]
29782984
},
@@ -2989,7 +2995,8 @@
29892995
"max_input_tokens": 1048576,
29902996
"max_output_tokens": 65535,
29912997
"available_providers": [
2992-
"google"
2998+
"google",
2999+
"vertex"
29933000
]
29943001
},
29953002
"gemini-2.5-flash": {
@@ -3005,6 +3012,7 @@
30053012
"max_input_tokens": 1048576,
30063013
"max_output_tokens": 65535,
30073014
"available_providers": [
3015+
"google",
30083016
"vertex"
30093017
]
30103018
},
@@ -3021,6 +3029,7 @@
30213029
"max_input_tokens": 1048576,
30223030
"max_output_tokens": 65535,
30233031
"available_providers": [
3032+
"google",
30243033
"vertex"
30253034
]
30263035
},
@@ -3038,6 +3047,7 @@
30383047
"max_input_tokens": 1048576,
30393048
"max_output_tokens": 65535,
30403049
"available_providers": [
3050+
"google",
30413051
"vertex"
30423052
]
30433053
},
@@ -3164,6 +3174,7 @@
31643174
"max_input_tokens": 1048576,
31653175
"max_output_tokens": 65535,
31663176
"available_providers": [
3177+
"google",
31673178
"vertex"
31683179
]
31693180
},
@@ -3183,6 +3194,7 @@
31833194
"max_input_tokens": 1048576,
31843195
"max_output_tokens": 65535,
31853196
"available_providers": [
3197+
"google",
31863198
"vertex"
31873199
]
31883200
},
@@ -3199,6 +3211,7 @@
31993211
"max_input_tokens": 1048576,
32003212
"max_output_tokens": 65535,
32013213
"available_providers": [
3214+
"google",
32023215
"vertex"
32033216
]
32043217
},
@@ -3214,21 +3227,23 @@
32143227
"max_input_tokens": 1048576,
32153228
"max_output_tokens": 8192,
32163229
"available_providers": [
3230+
"google",
32173231
"vertex"
32183232
]
32193233
},
32203234
"gemini-2.0-flash-001": {
32213235
"format": "google",
32223236
"flavor": "chat",
32233237
"multimodal": true,
3224-
"input_cost_per_mil_tokens": 0.15,
3225-
"output_cost_per_mil_tokens": 0.6,
3226-
"input_cache_read_cost_per_mil_tokens": 0.0375,
3238+
"input_cost_per_mil_tokens": 0.1,
3239+
"output_cost_per_mil_tokens": 0.4,
3240+
"input_cache_read_cost_per_mil_tokens": 0.025,
32273241
"deprecation_date": "2026-06-01",
32283242
"parent": "gemini-2.0-flash",
32293243
"max_input_tokens": 1048576,
32303244
"max_output_tokens": 8192,
32313245
"available_providers": [
3246+
"google",
32323247
"vertex"
32333248
]
32343249
},
@@ -3244,6 +3259,7 @@
32443259
"max_input_tokens": 1048576,
32453260
"max_output_tokens": 8192,
32463261
"available_providers": [
3262+
"google",
32473263
"vertex"
32483264
]
32493265
},
@@ -3259,6 +3275,7 @@
32593275
"max_input_tokens": 1048576,
32603276
"max_output_tokens": 8192,
32613277
"available_providers": [
3278+
"google",
32623279
"vertex"
32633280
]
32643281
},
@@ -3272,6 +3289,7 @@
32723289
"max_input_tokens": 65536,
32733290
"max_output_tokens": 32768,
32743291
"available_providers": [
3292+
"google",
32753293
"vertex"
32763294
]
32773295
},
@@ -3280,13 +3298,13 @@
32803298
"flavor": "chat",
32813299
"multimodal": true,
32823300
"input_cost_per_mil_tokens": 0.075,
3283-
"output_cost_per_mil_tokens": 0.3,
3301+
"output_cost_per_mil_tokens": 0,
32843302
"displayName": "Gemini 1.5 Flash",
32853303
"deprecation_date": "2025-09-29",
3286-
"max_input_tokens": 1000000,
3304+
"max_input_tokens": 8192,
32873305
"max_output_tokens": 8192,
32883306
"available_providers": [
3289-
"vertex"
3307+
"google"
32903308
]
32913309
},
32923310
"gemini-1.5-flash-latest": {
@@ -3488,12 +3506,13 @@
34883506
"format": "google",
34893507
"flavor": "chat",
34903508
"multimodal": true,
3491-
"input_cost_per_mil_tokens": 0,
3492-
"output_cost_per_mil_tokens": 0,
3509+
"input_cost_per_mil_tokens": 0.3,
3510+
"output_cost_per_mil_tokens": 2.5,
3511+
"input_cache_read_cost_per_mil_tokens": 0.03,
34933512
"experimental": true,
34943513
"deprecated": true,
3495-
"max_input_tokens": 2097152,
3496-
"max_output_tokens": 8192,
3514+
"max_input_tokens": 1048576,
3515+
"max_output_tokens": 65535,
34973516
"available_providers": [
34983517
"google"
34993518
]
@@ -6189,6 +6208,23 @@
61896208
"azure"
61906209
]
61916210
},
6211+
"gpt-5.4-mini-2026-03-17": {
6212+
"format": "openai",
6213+
"flavor": "chat",
6214+
"multimodal": true,
6215+
"input_cost_per_mil_tokens": 0.75,
6216+
"output_cost_per_mil_tokens": 4.5,
6217+
"input_cache_read_cost_per_mil_tokens": 0.075,
6218+
"displayName": "GPT-5.4 mini (2026-03-17)",
6219+
"reasoning": true,
6220+
"parent": "gpt-5.4-mini",
6221+
"max_input_tokens": 400000,
6222+
"max_output_tokens": 128000,
6223+
"available_providers": [
6224+
"openai",
6225+
"azure"
6226+
]
6227+
},
61926228
"gpt-5.4-nano": {
61936229
"format": "openai",
61946230
"flavor": "chat",

0 commit comments

Comments
 (0)