8484 "gpt2-chatbot" ,
8585 "im-also-a-good-gpt2-chatbot" ,
8686 "im-a-good-gpt2-chatbot" ,
87+ "gpt-4o-mini-2024-07-18" ,
8788 "gpt-4o-2024-05-13" ,
89+ "gpt-4o-2024-08-06" ,
90+ "chatgpt-4o-latest-20240903" ,
91+ "chatgpt-4o-latest" ,
92+ "o1-preview" ,
93+ "o1-mini" ,
8894)
8995
9096
@@ -1118,8 +1124,20 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
11181124 return get_conv_template ("gpt-4-turbo-2024-04-09" )
11191125 if "gpt2-chatbot" in model_path :
11201126 return get_conv_template ("gpt-4-turbo-2024-04-09" )
1121- if "gpt-4o" in model_path :
1127+ if "gpt-4o-2024-05-13 " in model_path :
11221128 return get_conv_template ("gpt-4-turbo-2024-04-09" )
1129+ if "gpt-4o-2024-08-06" in model_path :
1130+ return get_conv_template ("gpt-mini" )
1131+ if "anonymous-chatbot" in model_path :
1132+ return get_conv_template ("gpt-4-turbo-2024-04-09" )
1133+ if "chatgpt-4o-latest" in model_path :
1134+ return get_conv_template ("gpt-4-turbo-2024-04-09" )
1135+ if "gpt-mini" in model_path :
1136+ return get_conv_template ("gpt-mini" )
1137+ if "gpt-4o-mini-2024-07-18" in model_path :
1138+ return get_conv_template ("gpt-mini" )
1139+ if "o1" in model_path :
1140+ return get_conv_template ("api_based_default" )
11231141 return get_conv_template ("chatgpt" )
11241142
11251143
@@ -1167,7 +1185,7 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
11671185 if "claude-3-sonnet" in model_path :
11681186 return get_conv_template ("claude-3-sonnet-20240229" )
11691187 if "claude-3-5-sonnet" in model_path :
1170- return get_conv_template ("claude-3-5-sonnet-20240620" )
1188+ return get_conv_template ("claude-3-5-sonnet-20240620-v2 " )
11711189 if "claude-3-opus" in model_path :
11721190 return get_conv_template ("claude-3-opus-20240229" )
11731191 return get_conv_template ("claude" )
@@ -1212,19 +1230,6 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
12121230 return get_conv_template ("gemini" )
12131231
12141232
1215- class GeminiDevAdapter (BaseModelAdapter ):
1216- """The model adapter for Gemini 1.5 Pro"""
1217-
1218- def match (self , model_path : str ):
1219- return "gemini-1.5-pro" in model_path .lower ()
1220-
1221- def load_model (self , model_path : str , from_pretrained_kwargs : dict ):
1222- raise NotImplementedError ()
1223-
1224- def get_default_conv_template (self , model_path : str ) -> Conversation :
1225- return get_conv_template ("gemini-dev" )
1226-
1227-
12281233class BiLLaAdapter (BaseModelAdapter ):
12291234 """The model adapter for Neutralzz/BiLLa-7B-SFT"""
12301235
@@ -1575,7 +1580,7 @@ class Llama3Adapter(BaseModelAdapter):
15751580 """The model adapter for Llama-3 (e.g., meta-llama/Meta-Llama-3-8B-Instruct)"""
15761581
def match(self, model_path: str):
    """Return True when the lower-cased model path contains "llama-3-".

    The trailing hyphen keeps "llama-3.1" paths from matching this adapter.
    The keyword must not carry any surrounding whitespace, otherwise ordinary
    paths such as "meta-llama/Meta-Llama-3-8B-Instruct" can never match.
    """
    return "llama-3-" in model_path.lower()
15791584
15801585 def load_model (self , model_path : str , from_pretrained_kwargs : dict ):
15811586 model , tokenizer = super ().load_model (model_path , from_pretrained_kwargs )
@@ -1587,6 +1592,43 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
15871592 return get_conv_template ("llama-3" )
15881593
15891594
class Llama31Adapter(BaseModelAdapter):
    """The model adapter for Llama-3.1 (paths containing "llama-3.1")."""

    def match(self, model_path: str):
        """Return True when the lower-cased path contains a Llama-3.1 keyword.

        Always returns a bool (the loop-based form fell through to ``None``
        when nothing matched).
        """
        keywords = ("llama-3.1",)
        lowered = model_path.lower()
        return any(keyword in lowered for keyword in keywords)

    def load_model(self, model_path: str, from_pretrained_kwargs: dict):
        """Load through the base adapter, then copy the tokenizer's EOS and
        PAD token ids onto ``model.config``.

        Returns:
            The ``(model, tokenizer)`` pair.
        """
        model, tokenizer = super().load_model(model_path, from_pretrained_kwargs)
        model.config.eos_token_id = tokenizer.eos_token_id
        model.config.pad_token_id = tokenizer.pad_token_id
        return model, tokenizer

    def get_default_conv_template(self, model_path: str) -> Conversation:
        """Pick the conversation template for ``model_path``.

        Paths that equal (case-insensitively) one of the names listed below
        get the "meta-llama-3.1-sp" template; every other path gets
        "meta-llama-3.1".
        """
        # Exact, case-insensitive name comparison -- not a substring test.
        # NOTE(review): "the-real-chatbot-v2" does not contain "llama-3.1", so
        # ``match`` above never selects this adapter for it -- confirm whether
        # that entry is reachable through some other path.
        if model_path.lower() in [
            "llama-3.1-8b-instruct",
            "llama-3.1-70b-instruct",
            "the-real-chatbot-v2",
        ]:
            return get_conv_template("meta-llama-3.1-sp")
        return get_conv_template("meta-llama-3.1")
1620+
1621+
class GrokAdapter(BaseModelAdapter):
    """The model adapter for model paths containing "grok"."""

    def match(self, model_path: str):
        """Return whether the lower-cased path contains "grok"."""
        lowered = model_path.lower()
        return "grok" in lowered

    def get_default_conv_template(self, model_path: str) -> Conversation:
        """Return the "grok-2-mini" template when the lower-cased path
        contains "mini", otherwise the "grok-2" template."""
        lowered = model_path.lower()
        template_name = "grok-2-mini" if "mini" in lowered else "grok-2"
        return get_conv_template(template_name)
1630+
1631+
15901632class CuteGPTAdapter (BaseModelAdapter ):
15911633 """The model adapter for CuteGPT"""
15921634
@@ -2445,6 +2487,19 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
24452487 return get_conv_template ("api_based_default" )
24462488
24472489
class NoSystemAdapter(BaseModelAdapter):
    """The model adapter for an explicit list of model names, compared by
    exact (case-insensitive) equality; uses the "api_based_default" template."""

    def match(self, model_path: str):
        """Return True only when the lower-cased path equals a listed name."""
        exact_names = ["athene-70b"]
        # Whole-string equality, not a substring test.
        return model_path.lower() in exact_names

    def get_default_conv_template(self, model_path: str) -> Conversation:
        """Return the "api_based_default" conversation template."""
        template = get_conv_template("api_based_default")
        return template
2501+
2502+
24482503# Note: the registration order matters.
24492504# The one registered earlier has a higher matching priority.
24502505register_model_adapter (PeftModelAdapter )
@@ -2470,7 +2525,6 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
24702525register_model_adapter (BardAdapter )
24712526register_model_adapter (PaLM2Adapter )
24722527register_model_adapter (GeminiAdapter )
2473- register_model_adapter (GeminiDevAdapter )
24742528register_model_adapter (GemmaAdapter )
24752529register_model_adapter (ChatGPTAdapter )
24762530register_model_adapter (AzureOpenAIAdapter )
@@ -2545,6 +2599,9 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
25452599register_model_adapter (RekaAdapter )
25462600register_model_adapter (SmaugChatAdapter )
25472601register_model_adapter (Llama3Adapter )
2602+ register_model_adapter (Llama31Adapter )
2603+ register_model_adapter (GrokAdapter )
2604+ register_model_adapter (NoSystemAdapter )
25482605
25492606# After all adapters, try the default base adapter.
25502607register_model_adapter (BaseModelAdapter )
0 commit comments