We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 6253c6b + 8922741, commit 9b908fb (Copy full SHA for 9b908fb)
model.py
@@ -65,7 +65,7 @@ def from_name(cls, name: str):
65
"Mistral-7B": dict(n_layer=32, n_head=32, n_local_heads=8, dim=4096, intermediate_size=14336, vocab_size=32000),
66
"stories15M": dict(n_layer=6, n_head=6, dim=288),
67
"stories110M": dict(n_layer=12, n_head=12, dim=768),
68
- "Llama-3-8B": dict(block_size=8192, n_layer=32, n_head=32, n_local_heads=8, dim=4096, intermediate_size=14336, vocab_size=128256),
+ "Llama-3-8B": dict(block_size=8192, n_layer=32, n_head=32, n_local_heads=8, dim=4096, intermediate_size=14336, vocab_size=128256, rope_base=500000),
69
}
70
71
class KVCache(nn.Module):
0 commit comments