@@ -141,7 +141,8 @@ def generate(
141141 temperature : float = 0.7 ,
142142 top_p : float = 0.9 ,
143143 repetition_penalty : float = 1.15 , # Increased repetition penalty for better quality
144- top_k : int = 80 # Added top_k parameter for better quality
144+ top_k : int = 80 , # Added top_k parameter for better quality
145+ do_sample : bool = True # Added do_sample parameter
145146 ) -> Union [str , Generator [str , None , None ]]:
146147 """
147148 Generate text using the model with improved quality settings.
@@ -171,7 +172,8 @@ def generate(
171172 temperature = temperature ,
172173 top_p = top_p ,
173174 repetition_penalty = repetition_penalty ,
174- top_k = top_k
175+ top_k = top_k ,
176+ do_sample = do_sample
175177 )
176178
177179 return self ._run_coroutine (
@@ -184,6 +186,7 @@ def generate(
184186 top_p = top_p ,
185187 repetition_penalty = repetition_penalty ,
186188 top_k = top_k ,
189+ do_sample = do_sample ,
187190 timeout = 180.0 # Increased timeout for more complete responses (3 minutes)
188191 )
189192 )
@@ -197,7 +200,8 @@ def stream_generate(
197200 top_p : float = 0.9 ,
198201 timeout : float = 300.0 , # Increased timeout for more complete responses (5 minutes)
199202 repetition_penalty : float = 1.15 , # Increased repetition penalty for better quality
200- top_k : int = 80 # Added top_k parameter for better quality
203+ top_k : int = 80 , # Added top_k parameter for better quality
204+ do_sample : bool = True # Added do_sample parameter
201205 ) -> Generator [str , None , None ]:
202206 """
203207 Stream text generation with improved quality and reliability.
@@ -234,7 +238,8 @@ async def producer():
234238 timeout = timeout ,
235239 retry_count = 3 , # Increased retry count for better reliability
236240 repetition_penalty = repetition_penalty , # Pass the repetition penalty parameter
237- top_k = top_k # Pass the top_k parameter
241+ top_k = top_k , # Pass the top_k parameter
242+ do_sample = do_sample # Pass the do_sample parameter
238243 ):
239244 await queue .put (chunk )
240245
0 commit comments