We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8aebfd1 commit 2c674dc (Copy full SHA for 2c674dc)
keras_hub/src/models/smollm3/smollm3_causal_lm.py
@@ -70,7 +70,7 @@ def call_with_cache(
70
x = self.backbone.token_embedding(token_ids)
71
72
# Each decoder layer has a cache; we update them separately.
73
- position_embeddings = self.backbone.rotary_embedding(x)
+ position_embeddings = self.backbone.rotary_embedding(x, start_index=cache_update_index)
74
updated_cache = []
75
for i in range(self.backbone.num_layers):
76
current_cache = cache[:, i, ...]
0 commit comments