Skip to content
This repository was archived by the owner on Sep 10, 2025. It is now read-only.

Commit 82b2adb

Browse files
committed
feat: Add plumbing for Granite 3.0 8b and 3.1 2b/8b
Branch: GraniteThreeDenseSupport
Signed-off-by: Gabe Goodhart <[email protected]>
1 parent 6b6b77c commit 82b2adb

File tree

4 files changed

+82
-1
lines changed

4 files changed

+82
-1
lines changed

torchchat/model_config/models.json

Lines changed: 22 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -180,10 +180,31 @@
180180
"tokenizer_file": "tokenizer.json"
181181
},
182182
"ibm-granite/granite-3.0-2b-instruct": {
183-
"aliases": ["granite3-2b"],
183+
"aliases": ["granite3-2b", "granite3"],
184184
"distribution_channel": "HuggingFaceSnapshot",
185185
"distribution_path": "ibm-granite/granite-3.0-2b-instruct",
186186
"transformer_params_key": "Granite-3.0-2B-Instruct",
187187
"tokenizer_file": "tokenizer.json"
188+
},
189+
"ibm-granite/granite-3.0-8b-instruct": {
190+
"aliases": ["granite3-8b"],
191+
"distribution_channel": "HuggingFaceSnapshot",
192+
"distribution_path": "ibm-granite/granite-3.0-8b-instruct",
193+
"transformer_params_key": "Granite-3.0-8B-Instruct",
194+
"tokenizer_file": "tokenizer.json"
195+
},
196+
"ibm-granite/granite-3.1-2b-instruct": {
197+
"aliases": ["granite3.1-2b", "granite3.1"],
198+
"distribution_channel": "HuggingFaceSnapshot",
199+
"distribution_path": "ibm-granite/granite-3.1-2b-instruct",
200+
"transformer_params_key": "Granite-3.1-2B-Instruct",
201+
"tokenizer_file": "tokenizer.json"
202+
},
203+
"ibm-granite/granite-3.1-8b-instruct": {
204+
"aliases": ["granite3.1-8b"],
205+
"distribution_channel": "HuggingFaceSnapshot",
206+
"distribution_path": "ibm-granite/granite-3.1-8b-instruct",
207+
"transformer_params_key": "Granite-3.1-8B-Instruct",
208+
"tokenizer_file": "tokenizer.json"
188209
}
189210
}
torchchat/model_params/Granite-3.0-8B-Instruct.json

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
{
2+
"attention_multiplier": 0.0078125,
3+
"embedding_multiplier": 12.0,
4+
"dim": 4096,
5+
"block_size": 12800,
6+
"hidden_dim": 12800,
7+
"logits_scaling": 16.0,
8+
"n_heads": 32,
9+
"n_layers": 40,
10+
"n_local_heads": 8,
11+
"residual_multiplier": 0.22,
12+
"norm_eps": 1e-05,
13+
"rope_base": 10000,
14+
"tie_word_embeddings": true,
15+
"vocab_size": 49155,
16+
"use_hf_tokenizer": true,
17+
"tokenizer_prepend_bos": false,
18+
"attention_bias": false,
19+
"feed_forward_bias": false
20+
}
torchchat/model_params/Granite-3.1-2B-Instruct.json

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
{
2+
"attention_multiplier": 0.015625,
3+
"embedding_multiplier": 12.0,
4+
"dim": 2048,
5+
"block_size": 8192,
6+
"hidden_dim": 8192,
7+
"logits_scaling": 8.0,
8+
"n_heads": 32,
9+
"n_layers": 40,
10+
"n_local_heads": 8,
11+
"residual_multiplier": 0.22,
12+
"norm_eps": 1e-05,
13+
"rope_base": 5000000.0,
14+
"tie_word_embeddings": true,
15+
"vocab_size": 49155,
16+
"use_hf_tokenizer": true,
17+
"tokenizer_prepend_bos": false,
18+
"attention_bias": false,
19+
"feed_forward_bias": false
20+
}
torchchat/model_params/Granite-3.1-8B-Instruct.json

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
{
2+
"attention_multiplier": 0.0078125,
3+
"embedding_multiplier": 12.0,
4+
"dim": 4096,
5+
"block_size": 12800,
6+
"hidden_dim": 12800,
7+
"logits_scaling": 16.0,
8+
"n_heads": 32,
9+
"n_layers": 40,
10+
"n_local_heads": 8,
11+
"residual_multiplier": 0.22,
12+
"norm_eps": 1e-05,
13+
"rope_base": 10000000.0,
14+
"tie_word_embeddings": true,
15+
"vocab_size": 49155,
16+
"use_hf_tokenizer": true,
17+
"tokenizer_prepend_bos": false,
18+
"attention_bias": false,
19+
"feed_forward_bias": false
20+
}

0 commit comments

Comments
 (0)