Skip to content

Commit a8d33eb

Browse files
committed
Increase the genamt hard-limit ratio from 0.1 to 0.2 of max_context_length
1 parent 40443a9 commit a8d33eb

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

koboldcpp.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1384,7 +1384,7 @@ def generate(genparams, stream_flag=False):
1384 1384
print(f"\n!!! ====== !!!\n(Warning! Request max_context_length={max_context_length} exceeds allocated context size of {maxctx}. It will be reduced to fit. Consider launching with increased --contextsize to avoid issues. This message will only show once per session.)\n!!! ====== !!!")
1385 1385
showmaxctxwarning = False
1386 1386
max_context_length = maxctx
1387-
min_remain_hardlimit = max(min(max_context_length-4, 16),int(max_context_length*0.1))
1387+
min_remain_hardlimit = max(min(max_context_length-4, 16),int(max_context_length*0.2))
1388 1388
min_remain_softlimit = max(min(max_context_length-4, 16),int(max_context_length*0.4))
1389 1389
if max_length >= (max_context_length-min_remain_softlimit):
1390 1390
print(f"\n!!! ====== !!!\nWarning: You are trying to generate text with max_length ({max_length}) near or exceeding max_context_length limit ({max_context_length}).\nMost of the context will be removed, and your outputs will not be very coherent.\nConsider launching with increased --contextsize to avoid issues.\n!!! ====== !!!")

0 commit comments

Comments
 (0)