File tree Expand file tree Collapse file tree 2 files changed +4
-1
lines changed Expand file tree Collapse file tree 2 files changed +4
-1
lines changed Original file line number Diff line number Diff line change @@ -1069,7 +1069,7 @@ def norm_class(self) -> Type:
1069
1069
sliding_window_size = 512 ,
1070
1070
# 5 local layers for every global layer
1071
1071
sliding_window_indices = [0 if (i + 1 ) % 6 == 0 else 1 for i in range (26 )],
1072
- intermediate_size = 21504 ,
1072
+ intermediate_size = 6912 ,
1073
1073
n_embd = 1152 ,
1074
1074
n_layer = 26 ,
1075
1075
n_head = 4 ,
Original file line number Diff line number Diff line change @@ -602,6 +602,9 @@ def convert_hf_checkpoint(
602
602
elif model_name .lower ().startswith ("gemma-2" ):
603
603
qkv_weights = {}
604
604
copy_fn = partial (copy_weights_gemma_2 , qkv_weights )
605
+ elif model_name .lower ().startswith ("gemma-3" ):
606
+ qkv_weights = {}
607
+ copy_fn = partial (copy_weights_gemma_3 , qkv_weights )
605
608
elif model_name .lower ().startswith ("phi" ):
606
609
# holder to reconstitute the split q, k, v
607
610
qkv_weights = {}
You can’t perform that action at this time.
0 commit comments