We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent a5943b3, commit 221a879 (Copy full SHA for 221a879)
QEfficient/transformers/models/modeling_auto.py
@@ -3333,8 +3333,6 @@ def compile(
3333
ccl_lengths = self.comp_ctx_lengths_decode if prefill_seq_len == 1 else self.comp_ctx_lengths_prefill
3334
# Adding elements from self.comp_ctx_lengths_prefill to prefill_specialization
3335
for i in range(0, len(ccl_lengths)):
3336
- # if prefill_only or enable_chunking:
3337
- # raise NotImplementedError("prefill_only or enable_chunking is not supported with CCL")
3338
specializations.append(
3339
self.build_prefill_specialization(
3340
prefill_seq_len=prefill_seq_len,
0 commit comments