You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
inputPrice: 0.56,// $0.56 per million tokens (cache miss) - Updated Sept 5, 2025
15
-
outputPrice: 1.68,// $1.68 per million tokens - Updated Sept 5, 2025
16
-
cacheWritesPrice: 0.56,// $0.56 per million tokens (cache miss) - Updated Sept 5, 2025
17
-
cacheReadsPrice: 0.07,// $0.07 per million tokens (cache hit) - Updated Sept 5, 2025
14
+
inputPrice: 0.28,// $0.28 per million tokens (cache miss) - Updated Oct 29, 2025
15
+
outputPrice: 0.42,// $0.42 per million tokens - Updated Oct 29, 2025
16
+
cacheWritesPrice: 0.28,// $0.28 per million tokens (cache miss) - Updated Oct 29, 2025
17
+
cacheReadsPrice: 0.028,// $0.028 per million tokens (cache hit) - Updated Oct 29, 2025
18
18
description: `DeepSeek-V3 achieves a significant breakthrough in inference speed over previous models. It tops the leaderboard among open-source models and rivals the most advanced closed-source models globally.`,
19
19
},
20
20
"deepseek-reasoner": {
21
21
maxTokens: 65536,// 64K max output for reasoning mode
22
22
contextWindow: 128_000,
23
23
supportsImages: false,
24
24
supportsPromptCache: true,
25
-
inputPrice: 0.56,// $0.56 per million tokens (cache miss) - Updated Sept 5, 2025
26
-
outputPrice: 1.68,// $1.68 per million tokens - Updated Sept 5, 2025
27
-
cacheWritesPrice: 0.56,// $0.56 per million tokens (cache miss) - Updated Sept 5, 2025
28
-
cacheReadsPrice: 0.07,// $0.07 per million tokens (cache hit) - Updated Sept 5, 2025
25
+
inputPrice: 0.28,// $0.28 per million tokens (cache miss) - Updated Oct 29, 2025
26
+
outputPrice: 0.42,// $0.42 per million tokens - Updated Oct 29, 2025
27
+
cacheWritesPrice: 0.28,// $0.28 per million tokens (cache miss) - Updated Oct 29, 2025
28
+
cacheReadsPrice: 0.028,// $0.028 per million tokens (cache hit) - Updated Oct 29, 2025
29
29
description: `DeepSeek-R1 achieves performance comparable to OpenAI-o1 across math, code, and reasoning tasks. Supports Chain of Thought reasoning with up to 64K output tokens.`,
0 commit comments