You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
feat(deepseek): enhance model support with prompt caching and detailed usage metrics
- Add support for prompt caching in DeepSeek models
- Update model configurations to reflect caching capabilities
- Implement detailed usage metrics tracking cache write and read tokens
- Extend test coverage for new usage metrics and model parameters
- Update pricing information for DeepSeek models to include cache-related costs
inputPrice: 0.27,// $0.27 per million tokens (cache miss)
819
+
outputPrice: 1.1,// $1.10 per million tokens
820
+
cacheWritesPrice: 0.27,// $0.27 per million tokens (cache miss)
821
+
cacheReadsPrice: 0.07,// $0.07 per million tokens (cache hit)
820
822
description: `DeepSeek-V3 achieves a significant breakthrough in inference speed over previous models. It tops the leaderboard among open-source models and rivals the most advanced closed-source models globally.`,
821
823
},
822
824
"deepseek-reasoner": {
823
825
maxTokens: 8192,
824
826
contextWindow: 64_000,
825
827
supportsImages: false,
826
-
supportsPromptCache: false,
827
-
inputPrice: 0.55,// $0.55 per million tokens
828
+
supportsPromptCache: true,
829
+
inputPrice: 0.55,// $0.55 per million tokens (cache miss)
828
830
outputPrice: 2.19,// $2.19 per million tokens
829
-
description: `DeepSeek-R1 achieves performance comparable to OpenAI-o1 across math, code, and reasoning tasks.`,
831
+
cacheWritesPrice: 0.55,// $0.55 per million tokens (cache miss)
832
+
cacheReadsPrice: 0.14,// $0.14 per million tokens (cache hit)
833
+
thinking: true,// Supports Chain of Thought with 32K tokens
834
+
description: `DeepSeek-R1 achieves performance comparable to OpenAI-o1 across math, code, and reasoning tasks. Supports Chain of Thought reasoning with up to 32K tokens.`,
0 commit comments