File tree Expand file tree Collapse file tree 1 file changed +7
-2
lines changed
server/text_generation_server/models/custom_modeling Expand file tree Collapse file tree 1 file changed +7
-2
lines changed Original file line number Diff line number Diff line change @@ -62,6 +62,7 @@ def __init__(
62
62
pretraining_tp = 1 ,
63
63
tie_word_embeddings = False ,
64
64
rope_scaling = None ,
65
+ rope_theta = 10000.0 ,
65
66
** kwargs ,
66
67
):
67
68
self .vocab_size = vocab_size
@@ -82,6 +83,7 @@ def __init__(
82
83
self .pretraining_tp = pretraining_tp
83
84
self .use_cache = use_cache
84
85
self .rope_scaling = rope_scaling
86
+ self .rope_theta = rope_theta
85
87
86
88
super ().__init__ (
87
89
pad_token_id = pad_token_id ,
@@ -178,8 +180,11 @@ def __init__(
178
180
self .hidden_size = config .hidden_size
179
181
self .head_size = self .hidden_size // self .num_heads
180
182
181
- self .rotary_emb = PositionRotaryEmbedding .load (
182
- prefix = f"{ prefix } .rotary_emb" , weights = weights
183
+ # self.rotary_emb = PositionRotaryEmbedding.load(
184
+ # prefix=f"{prefix}.rotary_emb", weights=weights
185
+ # )
186
+ self .rotary_emb = PositionRotaryEmbedding .static (
187
+ dim = self .head_size , base = config .rope_theta , device = weights .device
183
188
)
184
189
185
190
self .softmax_scale = self .head_size ** - 0.5
You can’t perform that action at this time.
0 commit comments