@@ -19,7 +19,10 @@ def normalize_model_params(model_params)
1919 end
2020
2121 def default_options ( dialect )
22- options = { max_tokens : 3_000 , anthropic_version : "bedrock-2023-05-31" }
22+ max_tokens = 4096
23+ max_tokens = 8192 if bedrock_model_id . match? ( /3.5/ )
24+
25+ options = { max_tokens : max_tokens , anthropic_version : "bedrock-2023-05-31" }
2326
2427 options [ :stop_sequences ] = [ "</function_calls>" ] if !dialect . native_tool_support? &&
2528 dialect . prompt . has_tools?
@@ -40,6 +43,27 @@ def xml_tags_to_strip(dialect)
4043
4144 private
4245
# Translates the configured model name into the identifier string used for
# Bedrock requests. Short aliases are expanded to their full versioned
# ids; any name that is not a known alias is returned unchanged, so a full
# model id can be configured directly.
def bedrock_model_id
  configured_name = llm_model.name

  # Alias => full model id. Keys are compared by exact string equality.
  alias_to_model_id = {
    "claude-2" => "anthropic.claude-v2:1",
    "claude-3-haiku" => "anthropic.claude-3-haiku-20240307-v1:0",
    "claude-3-sonnet" => "anthropic.claude-3-sonnet-20240229-v1:0",
    "claude-instant-1" => "anthropic.claude-instant-v1",
    "claude-3-opus" => "anthropic.claude-3-opus-20240229-v1:0",
    "claude-3-5-sonnet" => "anthropic.claude-3-5-sonnet-20241022-v2:0",
    "claude-3-5-haiku" => "anthropic.claude-3-5-haiku-20241022-v1:0",
  }

  # Unknown names fall through untouched.
  alias_to_model_id.fetch(configured_name, configured_name)
end
66+
4367 def prompt_size ( prompt )
4468 # approximation
4569 tokenizer . size ( prompt . system_prompt . to_s + " " + prompt . messages . to_s )
@@ -48,24 +72,6 @@ def prompt_size(prompt)
4872 def model_uri
4973 region = llm_model . lookup_custom_param ( "region" )
5074
51- bedrock_model_id =
52- case llm_model . name
53- when "claude-2"
54- "anthropic.claude-v2:1"
55- when "claude-3-haiku"
56- "anthropic.claude-3-haiku-20240307-v1:0"
57- when "claude-3-sonnet"
58- "anthropic.claude-3-sonnet-20240229-v1:0"
59- when "claude-instant-1"
60- "anthropic.claude-instant-v1"
61- when "claude-3-opus"
62- "anthropic.claude-3-opus-20240229-v1:0"
63- when "claude-3-5-sonnet"
64- "anthropic.claude-3-5-sonnet-20241022-v2:0"
65- else
66- llm_model . name
67- end
68-
6975 if region . blank? || bedrock_model_id . blank?
7076 raise CompletionFailed . new ( I18n . t ( "discourse_ai.llm_models.bedrock_invalid_url" ) )
7177 end
0 commit comments