Skip to content

Commit b8b3077

Browse files
committed
fix: update sonnet 4 configs to reflect million-context-window pricing
1 parent a74fda1 commit b8b3077

File tree

2 files changed

+108
-48
lines changed

2 files changed

+108
-48
lines changed

litellm/model_prices_and_context_window_backup.json

Lines changed: 54 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -500,10 +500,14 @@
500500
"cache_creation_input_token_cost": 3.75e-06,
501501
"cache_read_input_token_cost": 3e-07,
502502
"input_cost_per_token": 3e-06,
503+
"input_cost_per_token_above_200k_tokens": 6e-06,
504+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
505+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
506+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
503507
"litellm_provider": "bedrock_converse",
504-
"max_input_tokens": 200000,
505-
"max_output_tokens": 64000,
506-
"max_tokens": 64000,
508+
"max_input_tokens": 1000000,
509+
"max_output_tokens": 64000,
510+
"max_tokens": 64000,
507511
"mode": "chat",
508512
"output_cost_per_token": 1.5e-05,
509513
"search_context_cost_per_query": {
@@ -764,10 +768,14 @@
764768
"cache_creation_input_token_cost": 3.75e-06,
765769
"cache_read_input_token_cost": 3e-07,
766770
"input_cost_per_token": 3e-06,
771+
"input_cost_per_token_above_200k_tokens": 6e-06,
772+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
773+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
774+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
767775
"litellm_provider": "bedrock_converse",
768-
"max_input_tokens": 200000,
769-
"max_output_tokens": 64000,
770-
"max_tokens": 64000,
776+
"max_input_tokens": 1000000,
777+
"max_output_tokens": 64000,
778+
"max_tokens": 64000,
771779
"mode": "chat",
772780
"output_cost_per_token": 1.5e-05,
773781
"search_context_cost_per_query": {
@@ -4727,10 +4735,14 @@
47274735
"cache_creation_input_token_cost_above_1hr": 6e-06,
47284736
"cache_read_input_token_cost": 3e-07,
47294737
"input_cost_per_token": 3e-06,
4738+
"input_cost_per_token_above_200k_tokens": 6e-06,
4739+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
4740+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
4741+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
47304742
"litellm_provider": "anthropic",
4731-
"max_input_tokens": 200000,
4732-
"max_output_tokens": 64000,
4733-
"max_tokens": 64000,
4743+
"max_input_tokens": 1000000,
4744+
"max_output_tokens": 64000,
4745+
"max_tokens": 64000,
47344746
"mode": "chat",
47354747
"output_cost_per_token": 1.5e-05,
47364748
"search_context_cost_per_query": {
@@ -7487,10 +7499,14 @@
74877499
"cache_creation_input_token_cost": 3.75e-06,
74887500
"cache_read_input_token_cost": 3e-07,
74897501
"input_cost_per_token": 3e-06,
7502+
"input_cost_per_token_above_200k_tokens": 6e-06,
7503+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
7504+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
7505+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
74907506
"litellm_provider": "bedrock_converse",
7491-
"max_input_tokens": 200000,
7492-
"max_output_tokens": 64000,
7493-
"max_tokens": 64000,
7507+
"max_input_tokens": 1000000,
7508+
"max_output_tokens": 64000,
7509+
"max_tokens": 64000,
74947510
"mode": "chat",
74957511
"output_cost_per_token": 1.5e-05,
74967512
"search_context_cost_per_query": {
@@ -16036,10 +16052,12 @@
1603616052
"openrouter/anthropic/claude-sonnet-4": {
1603716053
"input_cost_per_image": 0.0048,
1603816054
"input_cost_per_token": 3e-06,
16055+
"input_cost_per_token_above_200k_tokens": 6e-06,
16056+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
1603916057
"litellm_provider": "openrouter",
16040-
"max_input_tokens": 200000,
16041-
"max_output_tokens": 64000,
16042-
"max_tokens": 64000,
16058+
"max_input_tokens": 1000000,
16059+
"max_output_tokens": 64000,
16060+
"max_tokens": 64000,
1604316061
"mode": "chat",
1604416062
"output_cost_per_token": 1.5e-05,
1604516063
"supports_assistant_prefill": true,
@@ -18885,10 +18903,14 @@
1888518903
"cache_creation_input_token_cost": 3.75e-06,
1888618904
"cache_read_input_token_cost": 3e-07,
1888718905
"input_cost_per_token": 3e-06,
18906+
"input_cost_per_token_above_200k_tokens": 6e-06,
18907+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
18908+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
18909+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
1888818910
"litellm_provider": "bedrock_converse",
18889-
"max_input_tokens": 200000,
18890-
"max_output_tokens": 64000,
18891-
"max_tokens": 64000,
18911+
"max_input_tokens": 1000000,
18912+
"max_output_tokens": 64000,
18913+
"max_tokens": 64000,
1889218914
"mode": "chat",
1889318915
"output_cost_per_token": 1.5e-05,
1889418916
"search_context_cost_per_query": {
@@ -20221,10 +20243,14 @@
2022120243
"cache_creation_input_token_cost": 3.75e-06,
2022220244
"cache_read_input_token_cost": 3e-07,
2022320245
"input_cost_per_token": 3e-06,
20246+
"input_cost_per_token_above_200k_tokens": 6e-06,
20247+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
20248+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
20249+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
2022420250
"litellm_provider": "vertex_ai-anthropic_models",
20225-
"max_input_tokens": 200000,
20226-
"max_output_tokens": 64000,
20227-
"max_tokens": 64000,
20251+
"max_input_tokens": 1000000,
20252+
"max_output_tokens": 64000,
20253+
"max_tokens": 64000,
2022820254
"mode": "chat",
2022920255
"output_cost_per_token": 1.5e-05,
2023020256
"search_context_cost_per_query": {
@@ -20247,10 +20273,14 @@
2024720273
"cache_creation_input_token_cost": 3.75e-06,
2024820274
"cache_read_input_token_cost": 3e-07,
2024920275
"input_cost_per_token": 3e-06,
20276+
"input_cost_per_token_above_200k_tokens": 6e-06,
20277+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
20278+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
20279+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
2025020280
"litellm_provider": "vertex_ai-anthropic_models",
20251-
"max_input_tokens": 200000,
20252-
"max_output_tokens": 64000,
20253-
"max_tokens": 64000,
20281+
"max_input_tokens": 1000000,
20282+
"max_output_tokens": 64000,
20283+
"max_tokens": 64000,
2025420284
"mode": "chat",
2025520285
"output_cost_per_token": 1.5e-05,
2025620286
"search_context_cost_per_query": {

model_prices_and_context_window.json

Lines changed: 54 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -500,10 +500,14 @@
500500
"cache_creation_input_token_cost": 3.75e-06,
501501
"cache_read_input_token_cost": 3e-07,
502502
"input_cost_per_token": 3e-06,
503+
"input_cost_per_token_above_200k_tokens": 6e-06,
504+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
505+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
506+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
503507
"litellm_provider": "bedrock_converse",
504-
"max_input_tokens": 200000,
505-
"max_output_tokens": 64000,
506-
"max_tokens": 64000,
508+
"max_input_tokens": 1000000,
509+
"max_output_tokens": 64000,
510+
"max_tokens": 64000,
507511
"mode": "chat",
508512
"output_cost_per_token": 1.5e-05,
509513
"search_context_cost_per_query": {
@@ -764,10 +768,14 @@
764768
"cache_creation_input_token_cost": 3.75e-06,
765769
"cache_read_input_token_cost": 3e-07,
766770
"input_cost_per_token": 3e-06,
771+
"input_cost_per_token_above_200k_tokens": 6e-06,
772+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
773+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
774+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
767775
"litellm_provider": "bedrock_converse",
768-
"max_input_tokens": 200000,
769-
"max_output_tokens": 64000,
770-
"max_tokens": 64000,
776+
"max_input_tokens": 1000000,
777+
"max_output_tokens": 64000,
778+
"max_tokens": 64000,
771779
"mode": "chat",
772780
"output_cost_per_token": 1.5e-05,
773781
"search_context_cost_per_query": {
@@ -4727,10 +4735,14 @@
47274735
"cache_creation_input_token_cost_above_1hr": 6e-06,
47284736
"cache_read_input_token_cost": 3e-07,
47294737
"input_cost_per_token": 3e-06,
4738+
"input_cost_per_token_above_200k_tokens": 6e-06,
4739+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
4740+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
4741+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
47304742
"litellm_provider": "anthropic",
4731-
"max_input_tokens": 200000,
4732-
"max_output_tokens": 64000,
4733-
"max_tokens": 64000,
4743+
"max_input_tokens": 1000000,
4744+
"max_output_tokens": 64000,
4745+
"max_tokens": 64000,
47344746
"mode": "chat",
47354747
"output_cost_per_token": 1.5e-05,
47364748
"search_context_cost_per_query": {
@@ -7487,10 +7499,14 @@
74877499
"cache_creation_input_token_cost": 3.75e-06,
74887500
"cache_read_input_token_cost": 3e-07,
74897501
"input_cost_per_token": 3e-06,
7502+
"input_cost_per_token_above_200k_tokens": 6e-06,
7503+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
7504+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
7505+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
74907506
"litellm_provider": "bedrock_converse",
7491-
"max_input_tokens": 200000,
7492-
"max_output_tokens": 64000,
7493-
"max_tokens": 64000,
7507+
"max_input_tokens": 1000000,
7508+
"max_output_tokens": 64000,
7509+
"max_tokens": 64000,
74947510
"mode": "chat",
74957511
"output_cost_per_token": 1.5e-05,
74967512
"search_context_cost_per_query": {
@@ -16036,10 +16052,12 @@
1603616052
"openrouter/anthropic/claude-sonnet-4": {
1603716053
"input_cost_per_image": 0.0048,
1603816054
"input_cost_per_token": 3e-06,
16055+
"input_cost_per_token_above_200k_tokens": 6e-06,
16056+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
1603916057
"litellm_provider": "openrouter",
16040-
"max_input_tokens": 200000,
16041-
"max_output_tokens": 64000,
16042-
"max_tokens": 64000,
16058+
"max_input_tokens": 1000000,
16059+
"max_output_tokens": 64000,
16060+
"max_tokens": 64000,
1604316061
"mode": "chat",
1604416062
"output_cost_per_token": 1.5e-05,
1604516063
"supports_assistant_prefill": true,
@@ -18885,10 +18903,14 @@
1888518903
"cache_creation_input_token_cost": 3.75e-06,
1888618904
"cache_read_input_token_cost": 3e-07,
1888718905
"input_cost_per_token": 3e-06,
18906+
"input_cost_per_token_above_200k_tokens": 6e-06,
18907+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
18908+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
18909+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
1888818910
"litellm_provider": "bedrock_converse",
18889-
"max_input_tokens": 200000,
18890-
"max_output_tokens": 64000,
18891-
"max_tokens": 64000,
18911+
"max_input_tokens": 1000000,
18912+
"max_output_tokens": 64000,
18913+
"max_tokens": 64000,
1889218914
"mode": "chat",
1889318915
"output_cost_per_token": 1.5e-05,
1889418916
"search_context_cost_per_query": {
@@ -20221,10 +20243,14 @@
2022120243
"cache_creation_input_token_cost": 3.75e-06,
2022220244
"cache_read_input_token_cost": 3e-07,
2022320245
"input_cost_per_token": 3e-06,
20246+
"input_cost_per_token_above_200k_tokens": 6e-06,
20247+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
20248+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
20249+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
2022420250
"litellm_provider": "vertex_ai-anthropic_models",
20225-
"max_input_tokens": 200000,
20226-
"max_output_tokens": 64000,
20227-
"max_tokens": 64000,
20251+
"max_input_tokens": 1000000,
20252+
"max_output_tokens": 64000,
20253+
"max_tokens": 64000,
2022820254
"mode": "chat",
2022920255
"output_cost_per_token": 1.5e-05,
2023020256
"search_context_cost_per_query": {
@@ -20247,10 +20273,14 @@
2024720273
"cache_creation_input_token_cost": 3.75e-06,
2024820274
"cache_read_input_token_cost": 3e-07,
2024920275
"input_cost_per_token": 3e-06,
20276+
"input_cost_per_token_above_200k_tokens": 6e-06,
20277+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
20278+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
20279+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
2025020280
"litellm_provider": "vertex_ai-anthropic_models",
20251-
"max_input_tokens": 200000,
20252-
"max_output_tokens": 64000,
20253-
"max_tokens": 64000,
20281+
"max_input_tokens": 1000000,
20282+
"max_output_tokens": 64000,
20283+
"max_tokens": 64000,
2025420284
"mode": "chat",
2025520285
"output_cost_per_token": 1.5e-05,
2025620286
"search_context_cost_per_query": {

0 commit comments

Comments
 (0)