Skip to content

Commit 718b678

Browse files
committed
init
1 parent 50ac90e commit 718b678

File tree

3 files changed

+305
-27
lines changed

3 files changed

+305
-27
lines changed

optillm/inference.py

Lines changed: 10 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1604,30 +1604,33 @@ def get_effort_profile(reasoning_effort: str, max_tokens: int = 4096) -> dict:
16041604
# Base profiles with percentages and thought counts
16051605
profiles = {
16061606
"low": {
1607-
"min_tokens_pct": 0.25, # 25% of max_tokens
1607+
"min_tokens_pct": 0.10,
16081608
"max_tokens_pct": 0.33, # 33% of max_tokens
1609-
"max_thoughts": 4,
1609+
"max_thoughts": 64,
16101610
"thought_switch_tokens": [
16111611
"Wait,",
1612-
"Alternatively,"
1612+
"Alternatively,",
1613+
"However,",
1614+
"Additionally,",
16131615
],
16141616
"prefill": "Let me think about this briefly..."
16151617
},
16161618
"medium": {
1617-
"min_tokens_pct": 0.33, # 33% of max_tokens
1619+
"min_tokens_pct": 0.10,
16181620
"max_tokens_pct": 0.66, # 66% of max_tokens
1619-
"max_thoughts": 8,
1621+
"max_thoughts": 128,
16201622
"thought_switch_tokens": [
16211623
"Wait,",
16221624
"Alternatively,",
16231625
"However,",
1626+
"Additionally,",
16241627
],
16251628
"prefill": "Let me analyze this from multiple angles..."
16261629
},
16271630
"high": {
1628-
"min_tokens_pct": 0.66, # 66% of max_tokens
1631+
"min_tokens_pct": 0.10,
16291632
"max_tokens_pct": 0.90, # 90% of max_tokens
1630-
"max_thoughts": 16,
1633+
"max_thoughts": 256,
16311634
"thought_switch_tokens": [
16321635
"Wait,",
16331636
"Alternatively,",

0 commit comments

Comments
 (0)