Skip to content

Commit a7430a5

Browse files
committed
Limit temperature for AWS Bedrock requests to a maximum of 1.0
1 parent 09203bb commit a7430a5

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

app/core/model_handlers.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -169,11 +169,11 @@ def _handle_bedrock_request(self, prompt: str, retry_with_reduced_tokens: bool):
169 169
}]
170 170

171 171
inference_config = {
172-
"maxTokens": self.model_params.max_tokens or self.config.get('max_tokens', 8192),
173-
"temperature": self.model_params.temperature,
174-
"topP": self.model_params.top_p,
175-
"stopSequences": ["\n\nHuman:"]
176-
}
172+
"maxTokens": self.model_params.max_tokens or self.config.get('max_tokens', 8192),
173+
"temperature": min(self.model_params.temperature, 1.0),
174+
"topP": self.model_params.top_p,
175+
"stopSequences": ["\n\nHuman:"]
176+
}
177 177

178 178
response = self.bedrock_client.converse(
179 179
modelId=self.model_id,

0 commit comments

Comments
 (0)