Skip to content

Commit 30f2aa5

Browse files
committed
Adjust the token budget calculation in the deep thinking tool by subtracting an additional 1000 tokens
1 parent 040a6c3 commit 30f2aa5

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

refact-agent/engine/src/tools/tool_deep_thinking.rs

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@ async fn _make_prompt(
2828
let caps = try_load_caps_quickly_if_not_present(gcx.clone(), 0).await.map_err(|x| x.message)?;
2929
let tokenizer = cached_tokenizers::cached_tokenizer(caps, gcx.clone(), subchat_params.subchat_model.to_string()).await
3030
.map_err(|e| ScratchError::new(StatusCode::INTERNAL_SERVER_ERROR, format!("Error loading tokenizer: {}", e))).map_err(|x| x.message)?;
31-
let mut tokens_budget: i64 = (subchat_params.subchat_n_ctx - subchat_params.subchat_max_new_tokens - subchat_params.subchat_tokens_for_rag) as i64;
31+
let mut tokens_budget: i64 = (subchat_params.subchat_n_ctx - subchat_params.subchat_max_new_tokens - subchat_params.subchat_tokens_for_rag - 1000) as i64;
3232
let final_message = format!("***Problem:***\n{problem_statement}\n\n***Problem context:***\n");
3333
tokens_budget -= count_tokens(&tokenizer.read().unwrap(), &final_message) as i64;
3434
let mut context = "".to_string();

0 commit comments

Comments
 (0)