Skip to content

Commit 9eb0333

Browse files
committed
add telechat 2.5
1 parent 6a19ff4 commit 9eb0333

File tree

3 files changed

+18
-1
lines changed

3 files changed

+18
-1
lines changed

convert.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1824,7 +1824,7 @@ def state_dict_pp(cls, config, state_dict):
18241824
def dump_config(f, config, ggml_type):
18251825
assert config.hidden_act is None, 'hidden_act must be None'
18261826
assert not config.tie_word_embeddings, 'tie_word_embeddings must be False'
1827-
assert config.embed_layernorm is None, 'embed_layernorm must be None'
1827+
assert (config.embed_layernorm is None) or not config.embed_layernorm, 'embed_layernorm must be None'
18281828
assert not config.apply_residual_connection_post_layernorm, 'apply_residual_connection_post_layernorm must be False'
18291829
assert config.training_seqlen == config.base_seqlen, 'training_seqlen must equal to base_seqlen'
18301830

docs/models.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -245,6 +245,7 @@
245245

246246
* TeleChat (`TeleChat2ForCausalLM`)
247247
* [x] v2: [3B](https://huggingface.co/Tele-AI/TeleChat2-3B), [7B](https://huggingface.co/Tele-AI/TeleChat2-7B), [115B](https://huggingface.co/Tele-AI/TeleChat2-115B)
248+
* [x] v2.5: [35B](https://huggingface.co/Tele-AI/TeleChat2.5-35B/commit/e53676611f3c5072f7696a359132eaf456272151), [115B](https://huggingface.co/Tele-AI/TeleChat2-115B/tree/8be654fe28bfe60fca4cd483297167a6e570f93b)
248249

249250
* XVERSE (`XverseForCausalLM`)
250251
* [x] [Chat-7B](https://huggingface.co/xverse/XVERSE-7B-Chat), [Chat-13B](https://huggingface.co/xverse/XVERSE-13B-Chat), [Chat-65B](https://huggingface.co/xverse/XVERSE-65B-Chat)

scripts/models.json

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1779,6 +1779,22 @@
17791779
}
17801780
}
17811781
},
1782+
"telechat2.5": {
1783+
"brief": "TeleChat2.5 is a large language model trained by the Artificial Intelligence Research Institute of China Telecom.",
1784+
"default": "35b",
1785+
"license": "Apache License 2.0",
1786+
"variants": {
1787+
"35b": {
1788+
"default": "q4_0",
1789+
"quantized": {
1790+
"q4_0": {
1791+
"size": 19939670112,
1792+
"url": "chatllm_quantized_telechat/telechat2.5-35b-q4_0.bin"
1793+
}
1794+
}
1795+
}
1796+
}
1797+
},
17821798
"alphageometry-lm": {
17831799
"brief": "TeleChat2 is a large language model trained by the Artificial Intelligence Research Institute of China Telecom.",
17841800
"default": "0.2b",

0 commit comments

Comments
 (0)