We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents e1c72fd + 4a077e5 · commit ef8084a (Copy full SHA for ef8084a)
colossalai/shardformer/policies/falcon.py
@@ -246,6 +246,7 @@ def get_held_layers(self) -> List[Module]:
246
module = self.model.transformer
247
stage_manager = self.pipeline_stage_manager
248
held_layers = []
249
+ held_layers.append(module.rotary_emb)
250
if stage_manager.is_interleave:
251
assert stage_manager.num_model_chunks is not None
252
layers_per_stage = stage_manager.distribute_layers(len(module.h))
0 commit comments