Skip to content

Commit 2e380b6

Browse files
committed
Update inference.py
fix the thinking budgets
1 parent 7755946 commit 2e380b6

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

optillm/inference.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -1613,31 +1613,31 @@ def get_effort_profile(reasoning_effort: str, max_tokens: int = 4096) -> dict:
16131613
"However,",
16141614
"Additionally,",
16151615
],
1616-
"prefill": "Let me think about this briefly..."
1616+
"prefill": ""
16171617
},
16181618
"medium": {
16191619
"min_tokens_pct": 0.10,
16201620
"max_tokens_pct": 0.66, # 66% of max_tokens
1621-
"max_thoughts": 128,
1621+
"max_thoughts": 256,
16221622
"thought_switch_tokens": [
16231623
"Wait,",
16241624
"Alternatively,",
16251625
"However,",
16261626
"Additionally,",
16271627
],
1628-
"prefill": "Let me analyze this from multiple angles..."
1628+
"prefill": ""
16291629
},
16301630
"high": {
16311631
"min_tokens_pct": 0.10,
16321632
"max_tokens_pct": 0.90, # 90% of max_tokens
1633-
"max_thoughts": 256,
1633+
"max_thoughts": 512,
16341634
"thought_switch_tokens": [
16351635
"Wait,",
16361636
"Alternatively,",
16371637
"However,",
16381638
"Additionally,",
16391639
],
1640-
"prefill": "This requires careful analysis. Let me think through it systematically..."
1640+
"prefill": ""
16411641
}
16421642
}
16431643

0 commit comments

Comments
 (0)