Skip to content

Commit 185b2b8

Browse files
committed
Update model pricing and capabilities in JSON configuration
1 parent db2444e commit 185b2b8

File tree

2 files changed

+15
-75
lines changed

2 files changed

+15
-75
lines changed

docs/guides/available-models.md

Lines changed: 6 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -257,7 +257,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
257257
| Claude Sonnet 4 | us.anthropic.claude-sonnet-4-20250514-v1:0 | bedrock | 200000 | 4096 | In: $0.10, Out: $0.20 |
258258

259259

260-
### Openrouter (319)
260+
### Openrouter (318)
261261

262262
| Model | ID | Provider | Context | Max Output | Standard Pricing (per 1M tokens) |
263263
| :-- | :-- | :-- | --: | --: | :-- |
@@ -524,8 +524,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
524524
| Qwen: Qwen3 14B (free) | qwen/qwen3-14b:free | openrouter | 40960 | - | - |
525525
| Qwen: Qwen3 235B A22B | qwen/qwen3-235b-a22b | openrouter | 40960 | 40960 | In: $0.13, Out: $0.60 |
526526
| Qwen: Qwen3 235B A22B (free) | qwen/qwen3-235b-a22b:free | openrouter | 131072 | - | - |
527-
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | 262144 | In: $0.12, Out: $0.59 |
528-
| Qwen: Qwen3 235B A22B Instruct 2507 (free) | qwen/qwen3-235b-a22b-2507:free | openrouter | 262144 | - | - |
527+
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
529528
| Qwen: Qwen3 235B A22B Thinking 2507 | qwen/qwen3-235b-a22b-thinking-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
530529
| Qwen: Qwen3 30B A3B | qwen/qwen3-30b-a3b | openrouter | 40960 | 40960 | In: $0.08, Out: $0.29 |
531530
| Qwen: Qwen3 30B A3B (free) | qwen/qwen3-30b-a3b:free | openrouter | 40960 | - | - |
@@ -831,7 +830,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
831830
| Qwen: Qwen3 14B | qwen/qwen3-14b | openrouter | 40960 | - | In: $0.06, Out: $0.24 |
832831
| Qwen: Qwen3 235B A22B | qwen/qwen3-235b-a22b | openrouter | 40960 | 40960 | In: $0.13, Out: $0.60 |
833832
| Qwen: Qwen3 235B A22B (free) | qwen/qwen3-235b-a22b:free | openrouter | 131072 | - | - |
834-
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | 262144 | In: $0.12, Out: $0.59 |
833+
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
835834
| Qwen: Qwen3 235B A22B Thinking 2507 | qwen/qwen3-235b-a22b-thinking-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
836835
| Qwen: Qwen3 30B A3B | qwen/qwen3-30b-a3b | openrouter | 40960 | 40960 | In: $0.08, Out: $0.29 |
837836
| Qwen: Qwen3 32B | qwen/qwen3-32b | openrouter | 40960 | - | In: $0.03, Out: $0.03 |
@@ -1111,7 +1110,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
11111110
| Qwen: Qwen3 14B | qwen/qwen3-14b | openrouter | 40960 | - | In: $0.06, Out: $0.24 |
11121111
| Qwen: Qwen3 235B A22B | qwen/qwen3-235b-a22b | openrouter | 40960 | 40960 | In: $0.13, Out: $0.60 |
11131112
| Qwen: Qwen3 235B A22B (free) | qwen/qwen3-235b-a22b:free | openrouter | 131072 | - | - |
1114-
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | 262144 | In: $0.12, Out: $0.59 |
1113+
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
11151114
| Qwen: Qwen3 235B A22B Thinking 2507 | qwen/qwen3-235b-a22b-thinking-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
11161115
| Qwen: Qwen3 30B A3B | qwen/qwen3-30b-a3b | openrouter | 40960 | 40960 | In: $0.08, Out: $0.29 |
11171116
| Qwen: Qwen3 32B | qwen/qwen3-32b | openrouter | 40960 | - | In: $0.03, Out: $0.03 |
@@ -1139,7 +1138,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
11391138
| xAI: Grok Vision Beta | x-ai/grok-vision-beta | openrouter | 8192 | - | In: $5.00, Out: $15.00 |
11401139

11411140

1142-
### Streaming (395)
1141+
### Streaming (394)
11431142

11441143
| Model | ID | Provider | Context | Max Output | Standard Pricing (per 1M tokens) |
11451144
| :-- | :-- | :-- | --: | --: | :-- |
@@ -1482,8 +1481,7 @@ See the [Contributing Guide](https://github.com/crmne/ruby_llm/blob/main/CONTRIB
14821481
| Qwen: Qwen3 14B (free) | qwen/qwen3-14b:free | openrouter | 40960 | - | - |
14831482
| Qwen: Qwen3 235B A22B | qwen/qwen3-235b-a22b | openrouter | 40960 | 40960 | In: $0.13, Out: $0.60 |
14841483
| Qwen: Qwen3 235B A22B (free) | qwen/qwen3-235b-a22b:free | openrouter | 131072 | - | - |
1485-
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | 262144 | In: $0.12, Out: $0.59 |
1486-
| Qwen: Qwen3 235B A22B Instruct 2507 (free) | qwen/qwen3-235b-a22b-2507:free | openrouter | 262144 | - | - |
1484+
| Qwen: Qwen3 235B A22B Instruct 2507 | qwen/qwen3-235b-a22b-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
14871485
| Qwen: Qwen3 235B A22B Thinking 2507 | qwen/qwen3-235b-a22b-thinking-2507 | openrouter | 262144 | - | In: $0.12, Out: $0.12 |
14881486
| Qwen: Qwen3 30B A3B | qwen/qwen3-30b-a3b | openrouter | 40960 | 40960 | In: $0.08, Out: $0.29 |
14891487
| Qwen: Qwen3 30B A3B (free) | qwen/qwen3-30b-a3b:free | openrouter | 40960 | - | - |

lib/ruby_llm/models.json

Lines changed: 9 additions & 67 deletions
Original file line number | Diff line number | Diff line change
@@ -18557,16 +18557,16 @@
1855718557
"top_p",
1855818558
"tools",
1855918559
"tool_choice",
18560+
"structured_outputs",
18561+
"response_format",
1856018562
"stop",
1856118563
"frequency_penalty",
1856218564
"presence_penalty",
18563-
"repetition_penalty",
18564-
"response_format",
1856518565
"top_k",
18566-
"seed",
18567-
"min_p",
18568-
"structured_outputs",
18566+
"repetition_penalty",
1856918567
"logit_bias",
18568+
"min_p",
18569+
"seed",
1857018570
"logprobs",
1857118571
"top_logprobs"
1857218572
]
@@ -23845,7 +23845,7 @@
2384523845
"family": "qwen",
2384623846
"created_at": "2025-07-21 19:39:15 +0200",
2384723847
"context_window": 262144,
23848-
"max_output_tokens": 262144,
23848+
"max_output_tokens": null,
2384923849
"knowledge_cutoff": null,
2385023850
"modalities": {
2385123851
"input": [
@@ -23864,8 +23864,8 @@
2386423864
"pricing": {
2386523865
"text_tokens": {
2386623866
"standard": {
23867-
"input_per_million": 0.12,
23868-
"output_per_million": 0.59
23867+
"input_per_million": 0.1179,
23868+
"output_per_million": 0.1179
2386923869
}
2387023870
}
2387123871
},
@@ -23884,7 +23884,7 @@
2388423884
},
2388523885
"top_provider": {
2388623886
"context_length": 262144,
23887-
"max_completion_tokens": 262144,
23887+
"max_completion_tokens": null,
2388823888
"is_moderated": false
2388923889
},
2389023890
"per_request_limits": null,
@@ -23909,64 +23909,6 @@
2390923909
]
2391023910
}
2391123911
},
23912-
{
23913-
"id": "qwen/qwen3-235b-a22b-2507:free",
23914-
"name": "Qwen: Qwen3 235B A22B Instruct 2507 (free)",
23915-
"provider": "openrouter",
23916-
"family": "qwen",
23917-
"created_at": "2025-07-21 19:39:15 +0200",
23918-
"context_window": 262144,
23919-
"max_output_tokens": null,
23920-
"knowledge_cutoff": null,
23921-
"modalities": {
23922-
"input": [
23923-
"text"
23924-
],
23925-
"output": [
23926-
"text"
23927-
]
23928-
},
23929-
"capabilities": [
23930-
"streaming",
23931-
"predicted_outputs"
23932-
],
23933-
"pricing": {},
23934-
"metadata": {
23935-
"description": "Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass. It is optimized for general-purpose text generation, including instruction following, logical reasoning, math, code, and tool usage. The model supports a native 262K context length and does not implement \"thinking mode\" (<think> blocks).\n\nCompared to its base variant, this version delivers significant gains in knowledge coverage, long-context reasoning, coding benchmarks, and alignment with open-ended tasks. It is particularly strong on multilingual understanding, math reasoning (e.g., AIME, HMMT), and alignment evaluations like Arena-Hard and WritingBench.",
23936-
"architecture": {
23937-
"modality": "text->text",
23938-
"input_modalities": [
23939-
"text"
23940-
],
23941-
"output_modalities": [
23942-
"text"
23943-
],
23944-
"tokenizer": "Qwen3",
23945-
"instruct_type": null
23946-
},
23947-
"top_provider": {
23948-
"context_length": 262144,
23949-
"max_completion_tokens": null,
23950-
"is_moderated": false
23951-
},
23952-
"per_request_limits": null,
23953-
"supported_parameters": [
23954-
"max_tokens",
23955-
"temperature",
23956-
"top_p",
23957-
"stop",
23958-
"frequency_penalty",
23959-
"presence_penalty",
23960-
"seed",
23961-
"top_k",
23962-
"min_p",
23963-
"repetition_penalty",
23964-
"logprobs",
23965-
"logit_bias",
23966-
"top_logprobs"
23967-
]
23968-
}
23969-
},
2397023912
{
2397123913
"id": "qwen/qwen3-235b-a22b-thinking-2507",
2397223914
"name": "Qwen: Qwen3 235B A22B Thinking 2507",

0 commit comments

Comments (0)